diff --git a/.env b/.env new file mode 100644 index 00000000..f519e257 --- /dev/null +++ b/.env @@ -0,0 +1,7 @@ +POSTGRES_CONN_ID = alkemy_db +AWS_S3_CONN_ID = aws_s3_bucket +ACCESS_KEY = +SECRET_ACCESS_KEY = +BUCKET = + + diff --git a/.gitignore b/.gitignore new file mode 100644 index 00000000..cceb8540 --- /dev/null +++ b/.gitignore @@ -0,0 +1,44 @@ +.git +.vscode +.env +.ipynb_checkpoints +.code +.astro +Cleandata.ipynb +airflow_settings.yaml +astro +main.py +config.yaml +__pycache__ +airflow_lab.py +airtask.py +example_dag_advanced.py +example_dag_basic.py +hookfunction.py +hookexample.py +/tests +Dockerfile +.dockerignore +packages.txt +docker-compose.yml +docker-compose.override.yml +logging.conf +dac.cfg +/logs +webserver_config.py +airflow.cfg +S3update_dag.py +config_bre.yaml +config_etl.yaml +template_dag.jinja2 +.\Skill-Up-DA-c-PythonG1\.env + +/dags_dynamic/. +./dags/dags_factory +.po.py +nuevo.py +coco.py +po.py +GAUNVillaMaria_dag_etl.py + + diff --git a/README.md b/README.md index 7b4b97b1..9419c6cf 100644 --- a/README.md +++ b/README.md @@ -1,4 +1,5 @@ -# Proyecto #1 Flujos de ejecución + + ## Descripción Client: Ministerio de Educación de la Nación Situación inicial @@ -44,157 +45,9 @@ consultas SQL. códigos postales según requerimientos normalizados que se especifican para cada grupo de universidades, utilizando Pandas. -### Assets 🎨 - - -La base de datos con la información que reunió el Ministerio de Educación se proveerá en el transcurso del proyecto. - - -El archivo auxiliar de códigos postales se encuentra en la carpeta assets. - - -## Requerimientos: -# Airflow usando Docker -https://docs.astronomer.io/software/install-cli?tab=windows#install-the-astro-cli - -## Modulos utilizados en Python -- pathlib -- logging -- pandas -- datetime -- os -- sqlalchemy - -## Estructura y flujo de ejecución - Se generarán archivos ".sql" con las consultas correspondientes a cada centro educativo, normalizando las columnas tenidas en cuenta. 
- - Mediante operadores disponibles en apache airflow (Python operators y postgre operators, se toman las consultas ".sql" para obtener los datos de la base de datos provista. - - Estos datos se transorman mediante la libreria pandas, y se almacenan en forma local como archivos ".txt". - - Finalmete, a traves de las herramientas provistas por AWS (operadores y hooks S3), los datos almacenados como ".txt" son transformados a strings, y almacenados en el servicio S3. - -# Creación de una Wiki del proyecto -Se recomienda crear una wiki del proyecto en Github para dejar anotaciones, lecciones aprendidas o convenciones necesarias adicionales. - -# **Convención para nombrar carpetas** - -OT000-python - - -airflow - - -assets: archivos complementarios necesarios. - - -dags: para dejar los flujos que se vayan creando - - -datasets: para dejar el archivo resultante del proceso de transformación con Pandas - - -files: para almacenar la extracción de la base de datos. - - -include: para almacenar los SQL. - - -# **Convención para nombrar archivos** -### DAG ETL -Se colocará grupo-letra-siglas de la universidad y localidad, seguido por "_dag_elt.py" para diferenciar de otros csv. - -EJ: GFUNRioCuarto_dag_etl.py - - -# **Convencion para el nombre de la base de datos** - -### conexion con base de datos -se llamara 'alkemy_db' - -### conexion para S3 -se llamara 'aws_s3_bucket' - -### csv generados -Se colocará grupo-letra-siglas de la universidad y localidad, seguido por "_select.csv" para diferenciar el dag realizado. - -EJ: GFUNRioCuarto_select.csv - -### txt generados -Se colocará grupo-letra-siglas de la universidad y localidad, seguido por "_process.txt" para diferenciar el dag realizado. 
- -EJ: GFUNRioCuarto_process.txt - -# MATERIAL COMPLEMENTARIO - -# AIRFLOW - -https://airflow.apache.org/ - -# Informacion importante de como comenzar con Airflow -https://www.astronomer.io/guides/airflow-sql-tutorial/ - -# Curso de Alkemy de Airflow -https://academy.alkemy.org/curso/python/contenidos/clase-1-introduccion-a-flujos-de-trabajo - -# Guía definitiva de Airflow -[Guia](https://www.astronomer.io/ebooks/dags-definitive-guide.pdf) - -# Airflow Hooks Explained 101 -https://hevodata.com/learn/airflow-hooks/ - -# Create a S3 bucket into AWS. -https://docs.aws.amazon.com/es_es/elastictranscoder/latest/developerguide/gs-2-create-s3-buckets.html - -Create a S3 bucket and call it as you want. - -![image](https://user-images.githubusercontent.com/2921066/194301926-a98e757b-d618-432c-b103-98a2e91a563c.png) - -## Structure of S3 bucket -This is an important part, as I follow a specific folder structure in python scripts. Define the structure as follow: - -![image](https://user-images.githubusercontent.com/2921066/194302089-19e765a9-ef40-4245-9bbc-a53b2f0080e3.png) - -After create the s3 bucket, upload into the folder "preprocess/" the csv file that is located in the root path "talks_info.csv". - -## S3 IAM user -In order to be able to interact with the S3 bucket, we have to create an user (or use an existing one). - -![image](https://user-images.githubusercontent.com/2921066/194302165-2ce84708-2f99-4669-a013-d1ff17558f0f.png) - -## Permissions for the user -Since we have many services and specific permissions to interact with them, we have to assign the S3 permission to the new user. - -![image](https://user-images.githubusercontent.com/2921066/194302244-d96f0220-34f6-4eb2-97cc-05db9fc0d7f2.png) - -## Credentials -This is a very important step. You have to make sure of copy and save the credentials because we will use them later. 
- -![image](https://user-images.githubusercontent.com/2921066/194302285-47cbb07e-4128-40f3-aabd-0c7c3a276831.png) - -# Instalar providers de amazon -https://airflow.apache.org/docs/apache-airflow-providers-amazon/stable/index.html -# Documentacion de amazon s3 en airflow -https://airflow.apache.org/docs/apache-airflow-providers-amazon/stable/_api/airflow/providers/amazon/aws/hooks/s3/index.html - - -# From Local Filesystem to Amazon S3 -https://airflow.apache.org/docs/apache-airflow-providers-amazon/stable/operators/transfer/local_to_s3.html - -## Quickstart AWS SDK for Python. -https://boto3.amazonaws.com/v1/documentation/api/latest/guide/quickstart.html - - -## How to use Boto3 to upload files to an S3 Bucket? -https://www.learnaws.org/2022/07/13/boto3-upload-files-s3/ - - -# Airflow Dynamic DAGs: The powerful way with Jinja and YAML -https://www.youtube.com/watch?v=HuMgMTHrkn4&ab_channel=DatawithMarc - -# Dynamically Generating DAGs in Airflow -https://www.astronomer.io/guides/dynamically-generating-dags/ - -# Loggers - -# Configuración del archivo de logger.cfg -https://docs.python.org/3/library/logging.config.html#logging-config-fileformat -# Ejemplo de archivo de configuración -https://realpython.com/lessons/logger-config-file/ +## Integrantes y grupos asignados +- [Di Paola, Matias](https://github.com/dipaolme) - Grupo A +- [Breyner Ocampo Cardenas](https://github.com/BROC95) - Grupo B diff --git a/assets/GBUNComahue_dag_elt.cfg b/assets/GBUNComahue_dag_elt.cfg new file mode 100644 index 00000000..fdd56033 --- /dev/null +++ b/assets/GBUNComahue_dag_elt.cfg @@ -0,0 +1,41 @@ +[loggers] +keys=root,GBUNComahue_dag_elt + +[handlers] +keys=consoleHandler + +[formatters] +keys=detailedFormatter + +[logger_root] +level=DEBUG +handlers=consoleHandler + +[logger_GBUNComahue_dag_elt] +level=DEBUG +handlers=consoleHandler +qualname=GBUNComahue_dag_elt +propagate=0 + +[handler_consoleHandler] +class=StreamHandler +level=DEBUG +formatter=detailedFormatter 
+args=(sys.stdout,) + +[handler_simpleHandler] +formatter=simpleFormatter +class=handlers.RotatingFileHandler +maxBytes=31457280 +level=DEBUG +args=('/tmp/test.log',) + + +[formatter_detailedFormatter] +# format=%(asctime)s - %(name)s - %(levelname)s / %(message)s +format=%(asctime)s - %(name)s - %(message)s +datefmt='%Y-%m-%d' + + + + diff --git a/assets/GBUNSalvador_dag_elt.cfg b/assets/GBUNSalvador_dag_elt.cfg new file mode 100644 index 00000000..2713a846 --- /dev/null +++ b/assets/GBUNSalvador_dag_elt.cfg @@ -0,0 +1,41 @@ +[loggers] +keys=root,GBUNSalvador_dag_elt + +[handlers] +keys=consoleHandler + +[formatters] +keys=detailedFormatter + +[logger_root] +level=DEBUG +handlers=consoleHandler + +[logger_GBUNSalvador_dag_elt] +level=DEBUG +handlers=consoleHandler +qualname=GBUNSalvador_dag_elt +propagate=0 + +[handler_consoleHandler] +class=StreamHandler +level=DEBUG +formatter=detailedFormatter +args=(sys.stdout,) + +[handler_simpleHandler] +formatter=simpleFormatter +class=handlers.RotatingFileHandler +maxBytes=31457280 +level=DEBUG +args=('/tmp/test.log',) + + +[formatter_detailedFormatter] +# format=%(asctime)s - %(name)s - %(levelname)s / %(message)s +format=%(asctime)s - %(name)s - %(message)s +datefmt='%Y-%m-%d' + + + + diff --git a/assets/dag-factory.png b/assets/dag-factory.png new file mode 100644 index 00000000..89369ef5 Binary files /dev/null and b/assets/dag-factory.png differ diff --git a/assets/notebooks/GrupoB.ipynb b/assets/notebooks/GrupoB.ipynb new file mode 100644 index 00000000..13639010 --- /dev/null +++ b/assets/notebooks/GrupoB.ipynb @@ -0,0 +1,7519 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "b2a3f348", + "metadata": {}, + "source": [ + "# Broc95\n", + "\n", + "Proyecto ETL, se desarrollo un proyecto de data, en el cúal se debe extraer, transformar y cargar, información de las principales universidades de Argentina, se utilizo airflow con el manejo de dags, la extracción se realizo sobre una base de datos postgres, la 
transformación y análisis se realizo con pandas, por otro lado la carga se realizo en un bucket de amazon S3." + ] + }, + { + "cell_type": "markdown", + "id": "f70830ec", + "metadata": {}, + "source": [ + "# Dag factory grupo B\n" + ] + }, + { + "cell_type": "markdown", + "id": "50464330", + "metadata": {}, + "source": [ + "" + ] + }, + { + "cell_type": "code", + "execution_count": 155, + "id": "59772ffd", + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import matplotlib.pyplot as plt \n", + "from matplotlib.backends.backend_agg import FigureCanvasAgg as FigureCanvas\n", + "from matplotlib.figure import Figure\n", + "import numpy as np\n", + "import seaborn as sns\n", + "import requests " + ] + }, + { + "cell_type": "code", + "execution_count": 104, + "id": "f2703e2e", + "metadata": {}, + "outputs": [], + "source": [ + "import random\n", + "def hexAl():\n", + " color = [\"#\"+''.join([random.choice('0123456789ABCDEF') for j in range(6)])]\n", + "# print(color)\n", + " return color[0]\n", + "def grafLocation(df):\n", + " corrloc =df.groupby(df.location).count()\n", + " c4=corrloc.university>5\n", + " n =corrloc[c4]\n", + " colores = [hexAl() for i in range(len(n))]\n", + " corrloc[c4].university.plot(kind=\"bar\", color = colores,fontsize=20)\n", + " plt.title(f'Inscription by {df.location.name} > 5 in {df.university[0]}', fontsize=15)\n", + " plt.show()\n", + " ma= corrloc[c4]\n", + " ma.index\n", + " ma.max()\n", + " f =ma.age == ma.age.max()\n", + " name_L=ma[f].index[0]\n", + " loca =df1.location == ma[f].index[0]\n", + " grupoL =df1[loca]\n", + " N = len(grupoL)\n", + " colores = [hexAl() for i in range(N)]\n", + " grupoL.university.groupby(grupoL.inscmonth).count().plot(kind=\"bar\",color = colores,fontsize=20)\n", + " plt.title(f'Inscription by {df.location.name} > 5 in {df.university[0]} by {df.inscmonth.name}', fontsize=15)\n", + " plt.show()\n", + " grafBar(grupoL.career, name_L)\n", + " grafBar(grupoL.age, name_L)\n", + " 
grafBox(grupoL.gender,grupoL.age, name_L)\n", + " grafPie(grupoL,grupoL.age, name_L)\n", + " grafPie(grupoL,grupoL.gender, name_L)\n", + " grafPie(grupoL,grupoL.career, name_L)\n", + " graf3Rel(grupoL,grupoL.career,grupoL.age,grupoL.gender)\n", + " \n", + " \n", + " \n", + "def grafPie(dfD,dfg,location=\"\"):\n", + " total_precio = dfD.groupby(dfg).count()\n", + " colors = sns.color_palette('pastel')[0:6]\n", + " co = total_precio.columns[0]\n", + " plt.pie(total_precio[co],labels=total_precio.index, colors = colors,\n", + " autopct='%.0f%%')\n", + " plt.title(f\"Inscription by {dfg.name}: {location}\")\n", + " plt.show()\n", + "\n", + "# total_precio = dfD.groupby(dfg).count()\n", + "# print(total_precio)\n", + "# etiquetas = total_precio.index()\n", + "# # print()\n", + "# colors = sns.color_palette('pastel')[0:6]\n", + "# plt.pie(total_precio, labels = etiquetas, colors = colors,\n", + "# autopct='%.0f%%')\n", + "# plt.title(f\"Inscription by {dfg.name}: {location}\")\n", + "# plt.show()\n", + " \n", + "\n", + " \n", + "def grafBar(data,location=\"\"):\n", + " fig = plt.figure(figsize = (10,5))\n", + " plt.title(f\"Inscription by {data.name}: {location}\")\n", + " sns.countplot(data, order = data.value_counts().index)\n", + " plt.xticks(rotation=90)\n", + " plt.show()\n", + "\n", + "\n", + " \n", + "def graf3Rel(df,xd,yd,zd):\n", + " \n", + " sns.relplot(x=xd ,y=yd,hue=zd,data=df)\n", + " plt.title(f\"Inscription by {df.university.unique()[0]}\")\n", + " plt.xticks(rotation=90)\n", + " plt.show()\n", + "\n", + " \n", + "def grafBox(var1,var2, location=\"\"):\n", + " plt.title(f\"Inscription by {var1.name}:{var2.name}:{location}\")\n", + " sns.boxplot(x=var1,y=var2)\n", + " plt.xticks(rotation=90)\n", + " plt.show()\n", + " \n", + " \n", + "def url_todf(url):\n", + " df = pd.read_html(url)\n", + " df =df[0][1]\n", + " df =df.str.split(\"\\t\")\n", + " li =df.to_list()\n", + " df1 = pd.DataFrame(li[1:],columns=li[0])\n", + " return df1" + ] + }, + { + "cell_type": 
"code", + "execution_count": 105, + "id": "596e9b46", + "metadata": {}, + "outputs": [], + "source": [ + "url1 = \"https://github.com/dipaolme/Skill-Up-DA-c-Python/blob/grupoB/datasets/GBUNComahue_process.txt\"\n", + "url2 = \"https://github.com/dipaolme/Skill-Up-DA-c-Python/blob/grupoB/datasets/GBUNSalvador_process.txt\"\n", + "\n", + "df1 = url_todf(url1)\n", + "df2 = url_todf(url2)\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 106, + "id": "28af32af", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
universitycareerinscription_datefirst_namelast_namegenderagepostal_codelocationemail
0universidad del salvadorlicenciatura en ciencias de la computación2020-09-01caroldoylefemale373254colonia la blanquitaanthony88@gmail.com
1universidad del salvadorlicenciatura en ciencias antropológicas2020-09-01heiditranfemale278514laguna del barrotodd44@hotmail.com
2universidad del salvadorlicenciatura en planificación y diseño del pai...2020-09-01rachaelharringtonfemale237243antonio carbonizcantrell@yahoo.com
3universidad del salvadorlicenciatura en kinesiología y fisiatría2020-09-01ryansilvamale195272comandante lealheather60@gmail.com
4universidad del salvadoringeniería mecánica2020-09-01tiffanyknightfemale296533alfredo demarchibwarner@gmail.com
.................................
1899universidad del salvadorlicenciatura en sociología2021-02-01melissamcclurefemale336339cailomutarickey75@gmail.com
1900universidad del salvadoringeniería mecánica2021-02-01michaelmosesmale312703cabo san ferminlaura79@hotmail.com
1901universidad del salvadorlicenciatura en kinesiología y fisiatría2021-02-01lisajohnsonfemale297637la dulceabigail27@yahoo.com
1902universidad del salvadorlicenciatura en producción de bioimagenes2021-02-01pamelaclarkfemale191618ricardo rojaswilliam03@hotmail.com
1903universidad del salvadoringeniería en informática2021-02-01reneewalkerfemale211815escuela agricola don boscocbrown@yahoo.com
\n", + "

1904 rows × 10 columns

\n", + "
" + ], + "text/plain": [ + " university \\\n", + "0 universidad del salvador \n", + "1 universidad del salvador \n", + "2 universidad del salvador \n", + "3 universidad del salvador \n", + "4 universidad del salvador \n", + "... ... \n", + "1899 universidad del salvador \n", + "1900 universidad del salvador \n", + "1901 universidad del salvador \n", + "1902 universidad del salvador \n", + "1903 universidad del salvador \n", + "\n", + " career inscription_date \\\n", + "0 licenciatura en ciencias de la computación 2020-09-01 \n", + "1 licenciatura en ciencias antropológicas 2020-09-01 \n", + "2 licenciatura en planificación y diseño del pai... 2020-09-01 \n", + "3 licenciatura en kinesiología y fisiatría 2020-09-01 \n", + "4 ingeniería mecánica 2020-09-01 \n", + "... ... ... \n", + "1899 licenciatura en sociología 2021-02-01 \n", + "1900 ingeniería mecánica 2021-02-01 \n", + "1901 licenciatura en kinesiología y fisiatría 2021-02-01 \n", + "1902 licenciatura en producción de bioimagenes 2021-02-01 \n", + "1903 ingeniería en informática 2021-02-01 \n", + "\n", + " first_name last_name gender age postal_code \\\n", + "0 carol doyle female 37 3254 \n", + "1 heidi tran female 27 8514 \n", + "2 rachael harrington female 23 7243 \n", + "3 ryan silva male 19 5272 \n", + "4 tiffany knight female 29 6533 \n", + "... ... ... ... .. ... \n", + "1899 melissa mcclure female 33 6339 \n", + "1900 michael moses male 31 2703 \n", + "1901 lisa johnson female 29 7637 \n", + "1902 pamela clark female 19 1618 \n", + "1903 renee walker female 21 1815 \n", + "\n", + " location email \n", + "0 colonia la blanquita anthony88@gmail.com \n", + "1 laguna del barro todd44@hotmail.com \n", + "2 antonio carboni zcantrell@yahoo.com \n", + "3 comandante leal heather60@gmail.com \n", + "4 alfredo demarchi bwarner@gmail.com \n", + "... ... ... 
\n", + "1899 cailomuta rickey75@gmail.com \n", + "1900 cabo san fermin laura79@hotmail.com \n", + "1901 la dulce abigail27@yahoo.com \n", + "1902 ricardo rojas william03@hotmail.com \n", + "1903 escuela agricola don bosco cbrown@yahoo.com \n", + "\n", + "[1904 rows x 10 columns]" + ] + }, + "execution_count": 106, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df2" + ] + }, + { + "cell_type": "code", + "execution_count": 84, + "id": "e7f8f962", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 67, + "id": "9848956e", + "metadata": {}, + "outputs": [], + "source": [ + "# data =\"GBUNComahue_process.txt\"\n", + "\n", + "# df = pd.read_csv(data,sep=\"\\t\")\n", + "\n", + "\n", + "# df.career" + ] + }, + { + "cell_type": "code", + "execution_count": 107, + "id": "4491ad1d", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
universitycareerinscription_datefirst_namelast_namegenderagepostal_codelocationemailinscmonth
0universidad del salvadorlicenciatura en ciencias de la computación2020-09-01caroldoylefemale373254colonia la blanquitaanthony88@gmail.com2020-09-30
1universidad del salvadorlicenciatura en ciencias antropológicas2020-09-01heiditranfemale278514laguna del barrotodd44@hotmail.com2020-09-30
2universidad del salvadorlicenciatura en planificación y diseño del pai...2020-09-01rachaelharringtonfemale237243antonio carbonizcantrell@yahoo.com2020-09-30
3universidad del salvadorlicenciatura en kinesiología y fisiatría2020-09-01ryansilvamale195272comandante lealheather60@gmail.com2020-09-30
4universidad del salvadoringeniería mecánica2020-09-01tiffanyknightfemale296533alfredo demarchibwarner@gmail.com2020-09-30
....................................
1899universidad del salvadorlicenciatura en sociología2021-02-01melissamcclurefemale336339cailomutarickey75@gmail.com2021-02-28
1900universidad del salvadoringeniería mecánica2021-02-01michaelmosesmale312703cabo san ferminlaura79@hotmail.com2021-02-28
1901universidad del salvadorlicenciatura en kinesiología y fisiatría2021-02-01lisajohnsonfemale297637la dulceabigail27@yahoo.com2021-02-28
1902universidad del salvadorlicenciatura en producción de bioimagenes2021-02-01pamelaclarkfemale191618ricardo rojaswilliam03@hotmail.com2021-02-28
1903universidad del salvadoringeniería en informática2021-02-01reneewalkerfemale211815escuela agricola don boscocbrown@yahoo.com2021-02-28
\n", + "

1904 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " university \\\n", + "0 universidad del salvador \n", + "1 universidad del salvador \n", + "2 universidad del salvador \n", + "3 universidad del salvador \n", + "4 universidad del salvador \n", + "... ... \n", + "1899 universidad del salvador \n", + "1900 universidad del salvador \n", + "1901 universidad del salvador \n", + "1902 universidad del salvador \n", + "1903 universidad del salvador \n", + "\n", + " career inscription_date \\\n", + "0 licenciatura en ciencias de la computación 2020-09-01 \n", + "1 licenciatura en ciencias antropológicas 2020-09-01 \n", + "2 licenciatura en planificación y diseño del pai... 2020-09-01 \n", + "3 licenciatura en kinesiología y fisiatría 2020-09-01 \n", + "4 ingeniería mecánica 2020-09-01 \n", + "... ... ... \n", + "1899 licenciatura en sociología 2021-02-01 \n", + "1900 ingeniería mecánica 2021-02-01 \n", + "1901 licenciatura en kinesiología y fisiatría 2021-02-01 \n", + "1902 licenciatura en producción de bioimagenes 2021-02-01 \n", + "1903 ingeniería en informática 2021-02-01 \n", + "\n", + " first_name last_name gender age postal_code \\\n", + "0 carol doyle female 37 3254 \n", + "1 heidi tran female 27 8514 \n", + "2 rachael harrington female 23 7243 \n", + "3 ryan silva male 19 5272 \n", + "4 tiffany knight female 29 6533 \n", + "... ... ... ... .. ... \n", + "1899 melissa mcclure female 33 6339 \n", + "1900 michael moses male 31 2703 \n", + "1901 lisa johnson female 29 7637 \n", + "1902 pamela clark female 19 1618 \n", + "1903 renee walker female 21 1815 \n", + "\n", + " location email inscmonth \n", + "0 colonia la blanquita anthony88@gmail.com 2020-09-30 \n", + "1 laguna del barro todd44@hotmail.com 2020-09-30 \n", + "2 antonio carboni zcantrell@yahoo.com 2020-09-30 \n", + "3 comandante leal heather60@gmail.com 2020-09-30 \n", + "4 alfredo demarchi bwarner@gmail.com 2020-09-30 \n", + "... ... ... ... 
\n", + "1899 cailomuta rickey75@gmail.com 2021-02-28 \n", + "1900 cabo san fermin laura79@hotmail.com 2021-02-28 \n", + "1901 la dulce abigail27@yahoo.com 2021-02-28 \n", + "1902 ricardo rojas william03@hotmail.com 2021-02-28 \n", + "1903 escuela agricola don bosco cbrown@yahoo.com 2021-02-28 \n", + "\n", + "[1904 rows x 11 columns]" + ] + }, + "execution_count": 107, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dfg=pd.get_dummies(data=df1, columns=['gender'])\n", + "\n", + "# dfk = pd.DataFrame(pd.date_range('2000-01-02', freq='1M', periods=15), columns=['Date'])\n", + "df1.inscription_date =pd.to_datetime(df1['inscription_date'], format='%Y-%m-%d')\n", + "bins_dt = pd.date_range('2020-08-01' , freq='1M', periods=7)\n", + "bins_str = bins_dt.astype(str).values\n", + "labels = ['{}'.format( bins_str[i]) for i in range(1, len(bins_str))]\n", + "df1['inscmonth']=pd.cut(df1.inscription_date,\n", + " bins=bins_dt,\n", + " labels=labels)\n", + "\n", + "df1\n", + "dfg['inscmonth']=pd.cut(df1.inscription_date,\n", + " bins=bins_dt,\n", + " labels=labels)\n", + "\n", + "\n", + "dft=pd.get_dummies(data=df2, columns=['gender'])\n", + "\n", + "# dfk = pd.DataFrame(pd.date_range('2000-01-02', freq='1M', periods=15), columns=['Date'])\n", + "df2.inscription_date =pd.to_datetime(df2['inscription_date'], format='%Y-%m-%d')\n", + "bins_dt = pd.date_range('2020-08-01' , freq='1M', periods=7)\n", + "bins_str = bins_dt.astype(str).values\n", + "labels = ['{}'.format( bins_str[i]) for i in range(1, len(bins_str))]\n", + "df2['inscmonth']=pd.cut(df2.inscription_date,\n", + " bins=bins_dt,\n", + " labels=labels)\n", + "\n", + "df1\n", + "dft['inscmonth']=pd.cut(df2.inscription_date,\n", + " bins=bins_dt,\n", + " labels=labels)\n", + "df2" + ] + }, + { + "cell_type": "code", + "execution_count": 108, + "id": "cbf6041f", + "metadata": {}, + "outputs": [], + "source": [ + "\n", + "# df3=pd.get_dummies(data=df1, columns=['career','gender','location'])\n", + 
"\n", + "dfc=dfg.groupby(['career']).mean()\n", + "dfc=dfg.groupby(['career']).count()\n", + "dfa=dfg.groupby(['age']).count()\n", + "dfl=dfg.groupby(['location']).mean()\n", + "dfI=dfg.groupby(['inscription_date']).mean()\n", + "\n", + "dfcp = df1.groupby(df1.postal_code).count()\n", + "\n", + "dfc\n", + "\n", + "dfc =dfg.university.groupby(df1.career).count()\n", + "# dfc" + ] + }, + { + "cell_type": "code", + "execution_count": 114, + "id": "15a0f397", + "metadata": {}, + "outputs": [], + "source": [ + "# dfcg =df1.university.groupby([df1.career,df1.gender,df1.age]).count().plot(kind=\"bar\")\n", + "\n", + "df1.age = df1.age.astype(int)\n", + "df2.age = df2.age.astype(int)" + ] + }, + { + "cell_type": "code", + "execution_count": 113, + "id": "c8d9d53b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "university object\n", + "career object\n", + "inscription_date datetime64[ns]\n", + "first_name object\n", + "last_name object\n", + "gender object\n", + "age int32\n", + "postal_code object\n", + "location object\n", + "email object\n", + "inscmonth category\n", + "dtype: object" + ] + }, + "execution_count": 113, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df1.dtypes" + ] + }, + { + "cell_type": "markdown", + "id": "1244b609", + "metadata": {}, + "source": [ + "# General\n", + "## Comportamiento por universidad\n", + "\n", + "Grafícas de barras, pie, relación a 3 variables , para cada universidad \n", + "\n", + "\n", + "# Univerdidad Grupo B Comahue" + ] + }, + { + "cell_type": "code", + "execution_count": 153, + "id": "376176e7", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAmQAAAFPCAYAAADjktLUAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAnK0lEQVR4nO3debgkZXn38e8PRlBUZJkRZXMI4IJbxAlqjJFXTARUQCQKEQVER42CviFu0TeoESUa4xIjBmV1Y1OWuCtqjAvLsMiuIrIMsoxsorgEud8/qo42hzMzh+murnPmfD/X1depfp6qu+6uqu6+z1PV3akqJEmS1J81+k5AkiRprrMgkyRJ6pkFmSRJUs8syCRJknpmQSZJktQzCzJJkqSeWZBJHUpycZLtV3HZzZP8Msmao80KklSSrUYdd7ZI8qUk+/Sdx1SGOWbuxToWtsfAvGnOf3SSd05z3iuTPHO4DLtzbx6LNE7TejJKq4MkVwIvq6qvj2udVfXo6c47Ob+quhp4QEepzWlVtVPfOSzPvTlmJK0+HCGTOjDdkQdJksCCTHNUkn2TfCfJvya5JclPk+w0qf+KJLe3fS8a6Ht5kkvbvkuSbNu2X5nkjUkuAH6VZN7g6Zskb0tyUpLj22XPTfL4tu8TwObAf7WnKd8w+bRSko2TnJbk5iSXJ3n5QE5vS3JCkmPb2BcnWbSSzbBz+xh/nuS9SdZIslYb/7EDsR+c5I4kC6bYjlsm+UaSm9o4n0qy3kD/tknOa3M6sX3s7xzof06S85PcmuR7SR43zf13j1NuSb6V5GUD+29F+/dbSV6WZO123Y8Z6FuQ5NdJHrySHFa4zZO8KclPBo6T501afkXH0cQxs3aSDyT5WXv7QJK1277tkyxNclCSG5Ncl2S/gfjPbrf9L5Jck+Rt09m27bJPaI/P25McD9x3Uv+q7rf7JXlfkquS3Nbuo/u1fbu02/DWdv88amC5K5O8PskFSX6V5IgkG6U59Xx7kq8nWX9g/hOTXN+u49tJJo86rp/kC+2yZybZsl1uhcdVe/+l7X67JclXkjxsuttVWhELMs1lTwJ+CMwH3gMckcb9gQ8BO1XVA4E/B84HSPI3wNuAlwDrArsANw3E3At4NrBeVd05xTp3BU4ENgA+DZyS5D5V9WLgauC5VfWAqnrPFMseBywFNgb2AN6V5BkD/bu086wHnAZ8eCWP/3nAImDbNq+XVtXv2hh7T3pMp1fVsiliBHh3m9OjgM1otg9J1gJOBo5uH+9n2nXS9j8BOBJ4BbAh8J/AaQMFx0eSfGQlj2FFpty/gzNU1W+Bz7WPccILgP+uqhunsY4VbfOfAE8DHgS8HfhkkofCtI6jCW8Bngz8KfB4YDvgrQP9D2njbwLsD/zHQGHyqzb+ejTH5KuS7LayB9Tut1OAT9DstxOB5w/0r3C/rcS/Ak+keU5tALwBuCvJw2mOj9cBC4Av0vxzstbAss8H/gp4OPBc4EvAP7bzrwEcODDvl4CtgQcD5wKfmpTHnjT7ZH3gcuCQaeROkl3bde7ervd/2ryl4VWVN29z4gZcCTyznd4XuHygbx2gaN7g7g/cSvMGcL9JMb4CvHYF8V+6gnW+DThjoG8N4DrgaZPnbe8vbHOaR1Po/B544ED/u4GjB2J/faBvG+DXK9gWBew4cP/vaIouaAqZq4G095cAL5jmNt4NOK+d/kvg2ok4bdt3gHe204cB/zxp+R8CT5/Gev6wbQbavkVzDd4K9+8U8z4T+MnAvN8FXjKNHO7tNj8f2HWax9HEMfMTYOeBvmcBV7bT2wO/nrQNbgSevJy4HwDev7ztNzDfXwI/m7Tfvjfd/cak43jS8f5r4PFT9P0/4
IRJ814LbD8Q80UD/Z8FDhu4fwBwynIe93rtY31Qe/9o4OMD/TsDl03zuPoSsP+kPO8AHjad54c3byu6OUKmuez6iYmquqOdfEBV/Qp4IfBK4Lr21MYj2/7NaN4kl+ealazzD/1VdRd/HPFamY2Bm6vq9oG2q2hGRiZcPzB9B3DfrPhatsFcr5rIo6rObJffvn3cW9GM/txDe9rouCTXJvkF8EmaEamJnK+tqlrOOh8GHNSeoro1ya0023c622M6pty/U8z3TWCdJE9KspBmNOrke7sOJm3zJC8ZOK13K/AY/rhtVnYcTdiYZt9M+MN+at1Udx+JvYP2MbaP55tJliW5jeZ4ns/KTbXfBnNY1f02n+bU51SP+26Ps31uXMPdj+8bBqZ/PcX9ice9ZpJD05wu/gVNMTex/gmT99t0PzzzMOCDA4/7ZppR4k1WuJQ0DRZk0hSq6itV9VfAQ4HLgI+1XdcAW65o0ZWE3mxiIskawKY0oxErW/ZnwAZJHjjQtjnNKMKq2mxgevOBPACOoTlt+WLgpKr6zXJivIsm78dW1brtMhOnBa8DNpl0mnBwndcAh1TVegO3dapqOqeAftX+XWeg7SHTWO4equr3wAk0py33Aj4/qfC919rrij4GvAbYsKrWAy7ij9tmZcfRhJ/RFAETJu+nFfk0TSG9WVU9CPjowPpXZKr9tvnA9Krut58Dv2Hqx323x9muezNW7fj+W5pT8M+kOZ27cCLsNJZd2XF1DfCKSY/9flX1vVXIU7obCzJpknbUZ9f2WrLfAr8E7mq7Pw78Q5InttebbXUvL+p9YpLd21GU17Xxz2j7bgD+ZKqFquoamtNG705y3/Yi6v1pRqRW1euTrJ9kM+C1wPEDfZ+kud5rb+DYFcR4IM32uS3JJsDrB/q+T3Oa9TVpPuCwK801UBM+BryyHclJkvunuRB9sOicUjXXs10L7N2OiLyU6RU4y/NpmlHRF7XTw7o/TaG6DCDNxfaPGeif7nH0GeCtaT5oMB/4J6a/zx9IM6r6myTb0RQq0/F94E7gwCT3SbI7I9hv7ajXkcC/pfmAyppJntJee3YC8OwkOyS5D3AQzXNjVQqdB7bL3kRTWL1rugtO47j6KPDmtB8SSPKg9npAaWgWZNI9rQH8Pc1/7TcDTwdeBVBVJ9JcAPxp4Haai583uBexT6V547+FZvRp96r637bv3TRvvrcm+Ycplt2L5r/9n9GcUju4hvtOtVOBc2iubfoCcMRER1sAnktTVPzPCmK8neZDAbe1MT43EON3NBc/709zTd7ewOdp3iypqiXAy2kuhL+F5uLqfSeWT/LRJB9dwbpfTlMA3gQ8mlV7857I9Uya0ZGNaa4Tmsjhl0metgrxLgHeR1Pc3AA8lubatIn+6R5H76S5hu8C4EKafTLdLzX9O+AdSW6nKeROmGbuE/ttX5rj/4Xcfb+ucL+txD/QPI6z29j/AqxRVT+kOT7+nWYk7bk0H3D53TTjDjqW5vTntcAl/PEfnula7nFVVSe3OR/Xng69CJix32mn2WXiol1JHUvztQNbVdXeK5t3JkhyJPCzqnrrSmeefswzgY9W1VGjiilJqwO/vFLSPbQXt+8OPGHIOE+n+QTez2lOBz4O+PKw+UnS6sZTlpLuJsk/05yKeW9V/XTIcI8AfkBzyvIgYI+qum7ImJK02vGUpSRJUs8cIZMkSerZrL6GbP78+bVw4cK+05AkSVqpc8455+dVdY/fBYZZXpAtXLiQJUuW9J2GJEnSSiW5anl9nrKUJEnqmQWZJElSzyzIJEmSemZBJkmS1DMLMkmSpJ5ZkEmSJPXMgkySJKlnFmSSJEk9syCTJEnqmQWZJElSzyzIJEmSejarf8ty0LLDPjmSOAtetfdI4kiSJE2XI2SSJEk9syCTJEnqmQWZJElSzyzIJEmSemZBJkmS1DMLMkmSpJ5ZkEmSJPXMgkySJKlnFmSSJEk9syCTJEnqmQWZJElSzzory
JIcmeTGJBdNaj8gyWVJLk7ynoH2Nye5PMkPkzyrq7wkSZJmmi5/XPxo4MPAsRMNSf4PsCvw+Kr6bZIHt+3bAHsCjwY2Br6e5OFV9fsO85MkSZoROhshq6pvAzdPan4VcGhV/bad58a2fVfguKr6bVX9FLgc2K6r3CRJkmaScV9D9nDgaUnOTPLfSf6sbd8EuGZgvqVt2z0kWZxkSZIly5Yt6zhdSZKk7o27IJsHbAA8GXg9cEKS3JsAVXV4VS2qqkULFizoIkdJkqSxGndBthT4XDXOAu4C5gPXApsNzLdp2yZJkrTaG3dBdgrwfwCSPBxYC/g5cBqwZ5K1k2wBbA2cNebcJEmSetHZpyyTfAbYHpifZClwMHAkcGT7VRi/A/apqgIuTnICcAlwJ/BqP2EpSZLmis4Ksqraazldey9n/kOAQ7rKR5Ikaabym/olSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUs85+Oml1csNh7x1JnI1e9fqRxJEkSasXR8gkSZJ6ZkEmSZLUM09Z9uzqD+0xslibH3jSyGJJkqTxcYRMkiSpZxZkkiRJPfOU5Wrs7P987shi/dkr/mtksSRJ0t05QiZJktQzCzJJkqSeecpSq+wrR+w8kjjP2v+LI4kjSdJs5QiZJElSzyzIJEmSetZZQZbkyCQ3Jrloir6DklSS+e39JPlQksuTXJBk267ykiRJmmm6HCE7GthxcmOSzYC/Bq4eaN4J2Lq9LQYO6zAvSZKkGaWzgqyqvg3cPEXX+4E3ADXQtitwbDXOANZL8tCucpMkSZpJxnoNWZJdgWur6geTujYBrhm4v7RtmyrG4iRLkixZtmxZR5lKkiSNz9gKsiTrAP8I/NMwcarq8KpaVFWLFixYMJrkJEmSejTO7yHbEtgC+EESgE2Bc5NsB1wLbDYw76ZtmyRJ0mpvbCNkVXVhVT24qhZW1UKa05LbVtX1wGnAS9pPWz4ZuK2qrhtXbpIkSX3q8msvPgN8H3hEkqVJ9l/B7F8ErgAuBz4G/F1XeUmSJM00nZ2yrKq9VtK/cGC6gFd3lYskSdJM5m9ZakY6/qh7fIXdKnnhfl8eSRxJkrrkTydJkiT1zIJMkiSpZxZkkiRJPbMgkyRJ6pkFmSRJUs8syCRJknpmQSZJktQzCzJJkqSeWZBJkiT1zIJMkiSpZxZkkiRJPfO3LDXn/OcnnjWyWK948VdGFkuSNHc5QiZJktQzCzJJkqSeWZBJkiT1zIJMkiSpZ17UL43QIceP7gMDb3nhPT8wsN/JO44k9lHP+/JI4kiSRsMRMkmSpJ5ZkEmSJPXMgkySJKlnnV1DluRI4DnAjVX1mLbtvcBzgd8BPwH2q6pb2743A/sDvwcOrCq/cVMao51POWgkcb642/tGEkeS5pIuR8iOBiZfgfw14DFV9TjgR8CbAZJsA+wJPLpd5iNJ1uwwN0mSpBmjsxGyqvp2koWT2r46cPcMYI92elfguKr6LfDTJJcD2wHf7yo/SePz7JPfO7JYX3je60cWS5Jmij6/9uKlwPHt9CY0BdqEpW3bPSRZDCwG2HzzzbvMT9Is8OzPHj6yWF94/uKRxZKke6OXi/qTvAW4E/jUvV22qg6vqkVVtWjBggWjT06SJGnMxj5ClmRfmov9d6iqapuvBTYbmG3Ttk2SJGm1N9YRsiQ7Am8AdqmqOwa6TgP2TLJ2ki2ArYGzxpmbJElSX7r82ovPANsD85MsBQ6m+VTl2sDXkgCcUVWvrKqLk5wAXEJzKvPVVfX7rnKTJEmaSbr8lOVeUzQfsYL5DwEO6SofSZKkmcpv6pckSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zI
JMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9ayzgizJkUluTHLRQNsGSb6W5Mft3/Xb9iT5UJLLk1yQZNuu8pIkSZppuhwhOxrYcVLbm4DTq2pr4PT2PsBOwNbtbTFwWId5SZIkzSidFWRV9W3g5knNuwLHtNPHALsNtB9bjTOA9ZI8tKvcJEmSZpJxX0O2UVVd105fD2zUTm8CXDMw39K27R6SLE6yJMmSZcuWdZepJEnSmPR2UX9VFVCrsNzhVbWoqhYtWLCgg8wkSZLGa9wF2Q0TpyLbvze27dcCmw3Mt2nbJkmStNobd0F2GrBPO70PcOpA+0vaT1s+Gbht4NSmJEnSam1eV4GTfAbYHpifZClwMHAocEKS/YGrgBe0s38R2Bm4HLgD2K+rvCRJkmaaaRVkSU6vqh1W1jaoqvZaTtc9lmmvJ3v1dHKRJEla3aywIEtyX2AdmlGu9YG0XeuynE9BSpIk6d5Z2QjZK4DXARsD5/DHguwXwIe7S0uSJGnuWGFBVlUfBD6Y5ICq+vcx5SRJkjSnTOsasqr69yR/DiwcXKaqju0oL0mSpDljuhf1fwLYEjgf+H3bXIAFmSRJ0pCm+7UXi4Bt2k9DSpIkaYSm+8WwFwEP6TIRSZKkuWq6I2TzgUuSnAX8dqKxqnbpJCtJkqQ5ZLoF2du6TEKSJGkum+6nLP+760QkSZLmqul+yvJ2mk9VAqwF3Af4VVWt21VikiRJc8V0R8geODGdJMCuwJO7SkqSJGkume6nLP+gGqcAzxp9OpIkSXPPdE9Z7j5wdw2a7yX7TScZSZIkzTHT/ZTlcwem7wSupDltKUmSpCFN9xqy/bpORJIkaa6a1jVkSTZNcnKSG9vbZ5Ns2nVykiRJc8F0L+o/CjgN2Li9/VfbJkmSpCFNtyBbUFVHVdWd7e1oYEGHeUmSJM0Z0y3Ibkqyd5I129vewE1dJiZJkjRXTLcgeynwAuB64DpgD2DfjnKSJEmaU6ZbkL0D2KeqFlTVg2kKtLev6kqT/N8kFye5KMlnktw3yRZJzkxyeZLjk6y1qvElSZJmk+kWZI+rqlsm7lTVzcATVmWFSTYBDgQWVdVjgDWBPYF/Ad5fVVsBtwD7r0p8SZKk2Wa6BdkaSdafuJNkA6b/pbJTmQfcL8k8YB2a06DPAE5q+48BdhsiviRJ0qwx3aLqfcD3k5zY3v8b4JBVWWFVXZvkX4GrgV8DXwXOAW6tqjvb2ZYCm0y1fJLFwGKAzTfffFVSkCRJmlGmNUJWVccCuwM3tLfdq+oTq7LCdqRtV2ALmu80uz+w43SXr6rDq2pRVS1asMBv3pAkSbPftE87VtUlwCUjWOczgZ9W1TKAJJ8Dngqsl2ReO0q2KXDtCNYlSZI04033GrJRuhp4cpJ1kgTYgabQ+ybN12kA7AOc2kNukiRJYzf2gqyqzqS5eP9c4MI2h8OBNwJ/n+RyYEPgiHHnJkmS1IdhPim5yqrqYODgSc1XANv1kI4kSVKv+jhlKUmSpAEWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUs14KsiTrJTkpyWVJLk3ylCQbJPlakh+3f9fvIzdJkqRx62uE7IPAl6vqkcDjgUuBNwGnV9XWwOntfUmSpNXe2AuyJA8C/hI4AqCqfldVtwK7Ase0sx0D7Dbu3CRJkvrQxwjZFsAy4Kgk5yX5eJL7AxtV1XXtPNcDG021cJLFSZYkWbJs2bIxpSxJktSdPgqyecC2wGFV9QTgV0w6PVlVBdRUC1fV4VW1qKoWLViwoPNkJUmSutZHQbYUWFpVZ7b3T6Ip0G5I8lCA9u+NPeQmSZI0dmMvyKrqeuCaJ
I9om3YALgFOA/Zp2/YBTh13bpIkSX2Y19N6DwA+lWQt4ApgP5ri8IQk+wNXAS/oKTdJkqSx6qUgq6rzgUVTdO0w5lQkSZJ65zf1S5Ik9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPeivIkqyZ5Lwkn2/vb5HkzCSXJzk+yVp95SZJkjROfY6QvRa4dOD+vwDvr6qtgFuA/XvJSpIkacx6KciSbAo8G/h4ez/AM4CT2lmOAXbrIzdJkqRx62uE7APAG4C72vsbArdW1Z3t/aXAJlMtmGRxkiVJlixbtqzzRCVJkro29oIsyXOAG6vqnFVZvqoOr6pFVbVowYIFI85OkiRp/Ob1sM6nArsk2Rm4L7Au8EFgvSTz2lGyTYFre8hNkiRp7MY+QlZVb66qTatqIbAn8I2qehHwTWCPdrZ9gFPHnZskSVIfZtL3kL0R+Pskl9NcU3ZEz/lIkiSNRR+nLP+gqr4FfKudvgLYrs98JEmS+jCTRsgkSZLmJAsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9cyCTJIkqWcWZJIkST2zIJMkSeqZBZkkSVLPLMgkSZJ6ZkEmSZLUMwsySZKknlmQSZIk9Wxe3wlI0kz2nJM+NZI4n9/jRSOJI2n15AiZJElSzyzIJEmSejb2gizJZkm+meSSJBcneW3bvkGSryX5cft3/XHnJkmS1Ic+riG7Ezioqs5N8kDgnCRfA/YFTq+qQ5O8CXgT8MYe8pOksXjuSaeMJM5/7bHbSOJI6s/YR8iq6rqqOredvh24FNgE2BU4pp3tGGC3cecmSZLUh16vIUuyEHgCcCawUVVd13ZdD2y0nGUWJ1mSZMmyZcvGk6gkSVKHeivIkjwA+Czwuqr6xWBfVRVQUy1XVYdX1aKqWrRgwYIxZCpJktStXgqyJPehKcY+VVWfa5tvSPLQtv+hwI195CZJkjRuY7+oP0mAI4BLq+rfBrpOA/YBDm3/njru3CRpdbHbSaePLNYpe+xwt/t7fPbckcU+6fnbjiyWNJv18SnLpwIvBi5Mcn7b9o80hdgJSfYHrgJe0ENukqSeHXjyNSOJ86HnbTaSONI4jL0gq6rvAFlO9w7LaZckSVpt+VuWkqQ54+OfG83lyS/b/cH3aPvS8T8fSWyAnV44f2SxNDtYkEmSNMOdfdToPuf2Z/vds5hU//wtS0mSpJ45QiZJ0hx35QeuH0mcha97yD3arn/fZSOJ/ZCDHjmSODOVI2SSJEk9syCTJEnqmacsJUnSrHTDB78/slgbvfYpI4u1KizIJEmSJrnxw18aWawHv2anlc7jKUtJkqSeWZBJkiT1zIJMkiSpZxZkkiRJPbMgkyRJ6pkFmSRJUs8syCRJknpmQSZJktQzCzJJkqSeWZBJkiT1zIJMkiSpZxZkkiRJPbMgkyRJ6tmMK8iS7Jjkh0kuT/KmvvORJEnq2owqyJKsCfwHsBOwDbBXkm36zUqSJKlbM6ogA7YDLq+qK6rqd8BxwK495yRJktSpVFXfOfxBkj2AHavqZe39FwNPqqrXDMyzGFjc3n0E8MN7sYr5wM9HlO7qErvr+MYef3xjjz++sccf39jjj2/s4eM/rKoWTNUxb3T5jEdVHQ4cvirLJllSVYtGnNKsjt11fGOPP76xxx/f2OOPb+zxxzd2t/Fn2inLa4HNBu5v2rZJkiSttmZaQXY2sHWSLZKsBewJnNZzTpIkSZ2aUacsq+rOJK8BvgKsCRxZVRePcBWrdKpzNY/ddXxjjz++sccf39jjj2/s8cc3dofxZ9RF/ZIkSXPRTDtlKUmSNOdYk
EmSJPXMgkySJKlnFmSSJEk9syDTnJdknSRvSPL6JPdNsm+S05K8J8kD+s5PM0uSP0lyZJJ3JnlAko8luSjJiUkW9p3fvZHkwR3G/lFXsQVJ5iV5RZIvJ7mgvX0pySuT3Kfv/FZkNuc+WZINRxVrtS3I2hfKdyS5OMltSZYlOSPJviOI/biB6fskeWv7Bv6uJOsMGftzSfYedyGQZOiP7SbZcWD6QUmOaJ9on06y0bDxO3Q0sBGwBfAFYBHwXiDAYf2ltXJJzm2Pvy3HvN4vDbn8Q5IcluQ/kmyY5G1JLkxyQpKHDhl7jSQvTfKFJD9ot9FxSbYfJu6Ao2m+M/GXwBnAZcBOwJeBI4cJnGRRkm8m+WSSzZJ8rX39OjvJE4aMvcGk24bAWUnWT7LBkLFvT/KL9nZ7ktuBLSfah4ndxl83ybuTfCLJ307q+8iw8bvSvg4emuSyJDcnuSnJpW3bekOG/wTwp8DbgJ3b29uBxwOfHDI2SdZsi6Z/TvLUSX1vHTJ8Z7kneU2S+e30Vkm+neTWJGcmeeyQsQ8diL0oyRXAmUmuSvL0YWIDUFWr5Q04FdiX5tv+/x74f8DWwDHAu4aMfe7A9PtoXqCfDrwfOHbI2NcCJwE3AycAzwPWGtE22WA5tw2BpSOIP7hdPg68E3gY8H+BU4aNDbwV2LKDY+X89m+A6/nj18EEuGAE8R8AvAO4GLgNWEbzRr7vCGL/FPhX4GrgrHZbbzyi7bLtcm5PBK4bMvaXgQOANwEXAG+k+ZWOA4BTh4x9FM0L/V8AH2i3/V8BXwcOGMF2OW9g+url9a1i7LNoiru9gGuAPdr2HYDvDxn7rvZ4Gbz9b/v3iiFjfwg4Ftho8NgcxXHYxvoscCiwG82XhX8WWLvtO3fI2IuAb9IUApsBX2ufp2cDTxgy9lfaY/shA20Padu+OmTsH61K372I/3Hg08DrgHOAfxvoG3abd5Y7cPHA9BeA57XT2wPfHTL2hQPT3wT+rJ1+OLBk6G0+bICZegN+MOn+2e3fNYDLhox93sD0+cB92umh38AnYgPrAi8GvkjzBn4U8NdDxv49cMWkF+SJ+78bwTYfLMjOn9R3/pCxuyw8zh+YPnJFx9Eqxh/XPwdPAz5CU1R+E1g8guPlG22sybdfDxn7vIHpyUXNsMfKBZPun9H+XRu4dAT785z2BXg7mh8UXtS2bzWq5/9ytst5Q8Y+iKYQfuxA20+H3R4DsZ7YHi8Htq+zQxV5KzomgLcA36X5Z3LY4qDLIviHq9I3zdhnAH8DrDHQtgbwQuDMEWzzCwam59F8+enn2ufReTM198HtSvu+P9VjWsXYlwLzJh7DpL4Lh4ldtXoXZN8D/qKd3gX4ylQ7bBVjXwHsDjx/8gs8Q76BT/Xi0r7ovBL4xpCxfwxsvpy+a0awzZfSFBwHtdsoA33DPhG6LDw+DjxgivYtge+MYLt0+c/BVMfLmsCOwFFDxr4I2LqL42VwmwDvnNQ31AsbTcG0ZTu9LfDtgb5LRrA/dwB+2L44/wXNaM2PgRuBXYeM/X3gr9s3q6uA3dr2pzOK/8CbfwpOBP4NeCAjLJra+GvQFGT/A/xshHEvZeDNu23bl2bU+aohY583MD3qIvirwBu4+8jhRjQjZF8fMvZC4Pj2uPtRe7uxbdtiBNv8Hq9NwME0hfCPR5T7sjbvH48qd+AQmrNWfwL8I80I38OA/YDPDxn7gHafPoNmFP6D7XPz7cAnht7mwwaYqTeac9FnAbcA3wEe0bYvAA4cMvZRk24bte0PAU4fMva3h1l+JbFfDTx+OX2jOJVz8KTbgoHtMuyp3M4KjzbWdvxx+HkbmsLy2QwUlUPE7vKfg+M6PF72mHjeTNG325Cx38HURfBWwElDxn4GzUjqj2lGVp/Uti8A3jOibfOkgePl0cA/ADuPIO7jaU5zfQl4ZPuCfytN4fHnI9y3u9CMUlw/wpiDz6GnAf80im3SxnsP8Mwp2ndk+OKgsyIYW
B/4F5rrDG+huRTl0rZtgxEdh9vR/NP+1FEdh23sTwI7TtH+MuB/R3jcbNjePjnCmPsCZ9KMYN8OXAK8C3jQCGJvT1M4ngdcSHMWazHtmbJhbqv1TycleRSwCc3Q4i8H2nesqi8PGftJwF1VdXaSbWheGC6rqi8OlXQTezugZlvsNv4jabb5maPc5kmOq6o9R5HjFLEPpjllMY/m+pEn0Yy8/RVN8XTIkPEfRzMKtzXNG+tLq+pHSRYAe1XVh4aM38k2n+WxnwLc2dFzaPLxsh3wLUZ3vDwK2JiOtznNKektq+qiETw/O90mk3OftF12qqpV/pBJksfTFHx30VwK8SpgH5rreV9eVd8bQd6bMuL3oTFt807eL5KcNkXzM2hOeVNVuwwZfzDvR9PkfemInv+dvW6NpBqdiTeaYfPLgFOAKxk4lcDw1xwcTPPf5RLg3cDpNNcFfRt4y4hjf2M2xG7jH0BzKmfk23wl691vyOUvpBltWwf4BbBu234/RnBRf8e5d7bN2+dQV7G7zLuz52fXx0vHr1td7s9On0Oz+LVlNm/zLt+LzqUZgdueZiRye+C6dvrpI857lO/Pne3PqtX7lOWFtKdEaM5XLwFe294/bwSxu3pBnpWxu97mK1nv1UMuf95U0+3987vKe0S5d32cz9bYXR7nnR0vs3ibd7ZNus59Jeudyc/PcWzzrt6L1qAZjfwa8Kdt20iuZ+w4706Pw3msvtaodjixqq5sv4PopCQPo/k05DDurKrfA3ck+UlV/aJdz6+T3DVHY0OH2zzJBcvrorlIdhi/S7JOVd1B80mxiXU+iOY0xlA6zr3L43y2xu76OO/yeJmt27zT5xCz97VlNm/zzp5HVXUX8P4kJ7Z/b4CR1SNdPv+73J+r7xfDAjck+dOJO+1GfA4wHxjqy+Fonwjt9KifCLM1NnS7zTcCXgI8d4rbTUPG/sv2RW3ihWLCfWiuJRlWl7l3uc1na+yuj/Muj5fZus27fg7N1teW2bzNu34eUVVLq+pvaD7EMvSX2ba6zLvL/bn6XtSfZFOaSvn6KfqeWlXfHSL22lX12yna5wMPraoL51rsNk6X2/wImk9TfmeKvk9X1d9OsdiM0GXuHW/z2Rq70+O8S7N1m3dttr62zPJtPiufRx2/h3a6P1fbgkySJGm2WJ1PWUqSJM0KFmSSJEk9syCTJEnqmQWZJElSzyzIJM1JSU5Jck6Si5Msbtv2T/KjJGcl+ViSD7ftC5J8NsnZ7e2p/WYvaXXjpywlzUlJNqiqm5PcDzgbeBbwXWBbmh8k/gbwg6p6TZJPAx+pqu8k2ZzmtwIf1VvyklY7q/M39UvSihyY5Hnt9GbAi4H/rqqbAdpvEX942/9MYJvkD1/GvW6SB9TAjwtL0jAsyCTNOe1PnjwTeEpV3ZHkWzQ/6r28Ua81gCdX1W/GkqCkOcdryCTNRQ8CbmmLsUcCTwbuDzw9yfpJ5gHPH5j/q8ABE3cGfz5FkkbBgkzSXPRlYF6SS4FDgTOAa4F3AWfRXEt2JXBbO/+BwKIkFyS5BHjl2DOWtFrzon5Jak1cF9aOkJ0MHFlVJ/edl6TVnyNkkvRHb0tyPnAR8FPglF6zkTRnOEImSZLUM0fIJEmSemZBJkmS1DMLMkmSpJ5ZkEmSJPXMgkySJKln/x8TxrEZV9ShsQAAAABJRU5ErkJggg==", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAOcAAAD3CAYAAADmIkO7AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAgRUlEQVR4nO2dd5gURfrHP+/ukhwyKIqAGFExhwEFBbMwIoiCYlg9PXO688ep5zmKjuE8w3kqnJ55MGfUFQMiKKCOAQURMyhJlCUts+wuu1u/P6pXh3UzO1M9M+/neebZnu3uqm/39LffqurqKjHGoCiK/8hxLUBRlJpRcyqKT1FzKopPUXMqik9RcyqKT1FzKopPSRtzisg8ERncxH17icg6EcltXlUgIkZEdmjudJOJiIwTkcdc62gKIrJQRA53rSMVNMmcLk6QMaavMWZaQ7atrs8Y85Mxpq0xpiJpAhUARGQnEZkkIr+KyEoReUNE+iSsP0NEKrybZdVnsDvF/sX3kVNE8lxrUCxiqe+a6Qi8DPQBugExYFK1bd73bpZVn2nNLjYD2GRzenfCGSJym4isEpEFIjKk2vofRKTIW3dKwrqzRWS+t+5LEdnH+/9CEblCROYAcRHJS4yGXrHsORF52tv3UxHZ01s3EegFvOLdlS8Xkd5e8TPP26a7iLzs3dm/E5GzEzSNE5FnRCTqpT1PRPar5zQM9Y5xhYjcKiI5ItLSS3/3hLS3EJFiEdm8hvOYKyK3e2ksEJGLqmnuICIPisgyEVkiIjdUFdMb8BtsKyLTveN5C+haLe/+IjJLRFaLyOeJkUxEponIjSIyEygGtqvrRBhjYsaYB40xK40xG4B/A31EpEs957BGROQ0EflRRApF5B/V1uWIyJUi8r23/hkR6VxLOoNFZLF3PfzinccRIjJURL7xfqurErYPisj73jlZJiL3iEhLb914Ebm9Wvovi8hfveVdvPO22rt+jm3KsWOMafQHWAgc7i2fAWwAzgZygfOBpYAAAWAt0Mfbdiugr7c8ClgC7O9tuwOwTUL6nwE9gTY15DnOy/MEoAUwFlgAtKi+rfe9N2CAPO/7u8AEoDWwF/ArcGhC2iXAUO94bgY+qONcGOAdoDP2pvAN8Gdv3QTgloRtLwVeqSWd84AvgR5AJ2BKNc0vAvd553QLbEQ6t77fwFv/PnAH0Ao4GCgCHvPWbQ0UesebAxzhfd/cWz8N+AnoC+R55/tV4MoGXisjgGUJ388A4sAK71yFq46xhn13BdZ5mlt5x1CecB1cCnzgnbNW3vl5spa0Bnv7XuMdw9ne7/4E0M47vvXAtt72+wL9vWPuDcwH/uKtC3rnN8f73hV74+rmpf0dcBXQEjjUO999Gu2zZjLndwnrNvMuqi29C2k1cDyeyRK2ewO4tI70z6wjz3EkGMa7qJYBB9VnTqzhK4B2CetvBh5JSHtKtQtkfT3mPDrh+wXA295yP+yFXWWSj4HRtaQzFc9s3vfDEzR3A0oTzyEwBninAb9BL++iDCSsf4LfzXkFMLGG3+b0BHNe38TrpAf2Bjwm4X/bAdt6v9nu2BvS32vZ/xrgqYTvAaAs4TqYDxyWsH4r7E3qD2bHmnM9kOt9b+edo34J23wCjKhFy1+AFxO+zweO8JYvAl7zlg8CfsYzrve/J4FxjT1/zVXn/LlqwRhT7C22NcbEgROxUWGZiBSIyM7e+p7A93WkuaiePH9bb4ypBBYD3RugtTuw0hhTlPC/H7ERpIqfE5aLgdZSd903UeuPVTqMMR96+w/2jnsHbH2sNl2J6SQub4O9Iy/zikqrsVFii5o0J/4GXrqrvN8iUWNi2qOq0vXSHoi90GvS0iC8ovubwARjzJMJ2n4wxiwwxlQaY+YC12NLQDWx0Tnxjq
GwmvYXE3TPx954u9WSXqH5vVFwvfd3ecL69dhzVtWw9aqI/Cwia4Gb2Lg68Chwqrd8KjAxUbN3TVZR/fpqEElvEDLGvGGMOQL7Y38F3O+tWgRsX9eu9STds2pBbCNFD2xRo759lwKdRaRdwv96Ye/wTaVnwnKvBB3w+494GvCcMaakljSWYY+hpjQXYSNnV2NMR+/T3hjTtwHalgGdRCRQTWNi2hMT0u1ojAkYY/6ZsE2jXl0SkU5YY75sjLmxns0NtlpTm/bE33kzILHuuggYUk17a2PMpvyWVfwXe73uaIxpjy2mJup8DBjutXXsArzk/X8p0FM2bjhr0vWVVHOKSDcRGe5dGKXY+kPVHeUBYKyI7CuWHURkm0Ykv6+IjPQi2l+89D/w1i2nloYLY8wiYBZws4i0FpE9gLOwJ7up/E1EOolIT2w96OmEdY8Bx2ENGq0jjWeAS0VkaxHpiC1uVmlehr3YbxeR9l5DyPYiMqg+YcaYH7HF6eu8RqqBwLBq+oaJyFFeo1Rrr/GkR40J1oOItMcWi2caY66sYf0QEenmLe+MrXNWb82t4jngGBEZ6DXGXM/G1+y9wI1V142IbC4iw5uiuwbaYdtL1nk6z09caYxZDHyEjZjPG2OqInFVaelyEWnhNa4NA55qrIBkR84c4DLs3WQlMAjvII0xzwI3Yus/Rdg7T40tbbUwCVtkXoWNSiONbR0EW4e82ivujK1h3zHYeuhSbEPLtcaYKY05sBq0fIJtxCoAHqxa4d0MPsVGiPfqSON+rAHnALOB17B1xapiWD62geFL7DE/x8ZFz7o4GVv/XQlcS8JNwtM3HBsZfsVGo79Rx7UhIpMTWzarcRy2ke9PsvGzzKpofRgwR0Ti3jG+gC0y/gFjzDzgQuw1sgx73IsTNvkPtprwpogUYW/O/WrT3UjGYs9bEfa3ebqGbR7F1purirQYY8qwZhyCbfSaAOQbY75qrICqhoq0QkTGATsYY06tb1s/ICIPAUuNMVc3Yp8hwL3GmMaUJpQUIiIHY0se25gkGEkf8CcZEekNjAT2rme7NsAh2OjZDRvhXky2PqVpiEgLbBXmgWQYE9Kgh1A6IyIR4AvgVmPMgvo2B67DFt1mY1ser0muQqUpiMgu2EeEWwF3Ji2fdCzWKko2oJFTUXyKmlNRfIqaU1F8ippTUXyKmlNRfIqaU1F8ippTUXyKmlNRfIqaU1F8ippTUXyKmlNRfIqaU1F8ippTUXyKmlNRfIqaU2kSInKJ2AHBH09S+uNqGWIma9CREJSmcgF2/NjF9W6pNAk1p9JoRORe7OiGk0XkKewQp7thx9YdZ4yZJCJnYEd7DwA7ArdhByg7DTtS4lBjzEqxU2Gc4637DjgtYdzdqvy2B8YDm2NHtju7KQNmpRtarFUajTHmPOzIhYdgzTfVGBP0vt+aMEbubtjxk/bHjrRYbIzZGzs9RL63zQvGmP2NMXtih2Y5q4Ys/wdcbIzZFzsq3oTkHJm/0MipbCpHAscm1A9b8/ug1e94I+sXicga4BXv/3OBPbzl3UTkBuzsZG2xY97+hoi0BQ4EnhX5bUznVkk4Dt+h5lQ2FQGON8Z8vdE/Rfphi69VVCZ8r+T3a+8R7Pwkn3tF4cHV0s8BVhtj9mpW1WmAFmuVTeUN4GLxwpqI1DkEaA20w84B0wI4pfpKY8xaYIGIjPLSF28KhIxHzalsKhFsQ9AcEZnnfW8MYewUBjOxc5PUxCnAWSLyOTAPO0J9xqNDYyqKT9E6p8+JxuJbAzthpw/shm046VTt0xFbCipP+GxI+LsKO9dITZ+f8oOBqvlYFB+hkdMnRGPxXthWyb5YM+6EfT4YqGu/ZqAE+wjjc+wkSp8Dn+cHA4V17qUkHTWnA6KxeA72UcIA7ES1A9h4Pk4/sBQ7a9c7wDv5wcA8x3qyDjVniojG4p2xDRnHYadCbO9WUaNZjp1kaTLwpkbW5KPmTCLRWLw71owjgYPJnDp+JT
ANO/3d8/nBwFq3cjITNWczE43FO2Cb/k8F+lP7lOqZwnpsz5/Hgcn5wcCGerZXGoias5mIxuJB7Kzdo4HNHMtxRSF2evW78oOBb1yLSXfUnJtANBZviTXjxUDQsRw/UYmNprflBwMzXItJV9ScTSAai7fCvub0d+wEqkrtfIB9XezF/GCg0rWYdELN2QiisXgecCZwNf579OF3vsd27ZuoJm0Yas4GEI3Fc7ENPNdgXzJWms5nwNj8YOBt10L8jpqzHqKx+BDgDmBn11oyjNeAv+UHA1+6FuJX1Jy1EI3FtwL+A4xyrSWDqQAeAML5wcCvrsX4DTVnNbyudecDN5F+vXjSlRXARfnBwNOuhfgJNWcC0Vh8L+A+9LGIK54HLsgPBn5xLcQPqDn5LVpejW3wyXUsJ9tZAVyYHww841qIa7LenF7d8nHsyHGKf3gOOD8/GFjhWogrstqc0Vj8SGAisIVrLUqN/ASMzA8GPnEtxAVZaU6vM0EEuILM75ie7pQA5+UHA4+6FpJqss6c0Vi8K/ACcJBrLUqjGA/8NZveeskqc0Zj8R2wLwvv4FqL0iRmAKPyg4GfXQtJBVljzmgs3h94GTvfhpK+LAGOzIaeRVkxbm00Fh8BTEWNmQlsDbwbjcX3cy0k2WS8OaOx+MXYh9ttXGtRmo0uwNRoLD7YtZBkktHmjMbi/wDuIsOPM0tpB0yOxuLDXAtJFhl70UZj8bHADa51KEmlNfBCNBb/wxwrmUBGNghFY/GLgLtd61BSRiUwJtO6/GWcOaOx+NnYzuvauSC7KAOGZtJL3Bllzmgsno+d71GNmZ0UAYPzg4FPXQtpDjLGnNFYfCj2Oaa+VZLd/AIMyA8GvnMtZFPJCHNGY/GdsXM86svRCsAPwIH5wcBy10I2hbRvrY3G4p2wEVONqVSxHfBaNBZP62fbaW1Ob1S8p7FT5SlKIvsA97oWsSmktTmxo+Id4VqE36msqCB82oHccdkJANx7zZlcMWpvrhqzPw9Ezqe83L7o8dHUl/j7Sftx4zlHsG6NnURs+eIfGP+PfGfaN5F877FaWpK25ozG4n8CLnGtIx148+kJdO/d57fvBxx1Iv985lNufCJGWel6pk96BIApz97LuEfeZfBxZ/H+G/aR4fP3Xs/x517jQnZzcUc0Fu/nWkRTSEtzeq9+aSeDBrBy+RI+n/k6g4af/tv/9hxwFCKCiLBd3/1Y9csSAERyKC8rpaykmNy8Fnw9eyYdunRjy15p/YZdC+CpaCze0bWQxpJ25vTqmRNJ/nTsGcHj/76c0RfdgMgff+ry8g3Mmvwku/e3NYNjTh/LLRcN47MZk+l/5CgmPXQLw8+8ItWSk0Fv4GHXIhpL2pkTuBI776VSD5/NmEz7zpuz7S5717g++q+/0mevAfTZewAAu/U7lOujM/jr7c/y6bsF7HngUfz803fcfeUpPHTTRZSWFKdSfnMzwqsKpQ1p9ZwzGovvg521qoVrLenAM+OvZdbkJ8nNy2NDaQnr40Xse8ixnHfdg7z4wE389PUcLr7lCXJyNr5Hl5YU8+/LTmDsXZP492UncMktT/DR1Jco31DG4BFpdX1XZxWwa7qMpJA206BHY/HW2GnO1ZgNZPSF1zH6wusAmP/Ju0x+/C7Ou+5Bpk16hC8+eJsr7nn1D8YEeO2xOznixPPJy2tBWel6EEEkh7L0jpwAnbBtFWkxxUY6FWtvAHZxLSITePSWS1mz8hcifz6U8KkH8NIDN/+2btWvy1gw7xP2HWRfkzxi9HmMO+Ngpr74IP2PGu1KcnNygjcyhu9Ji2JtNBbfDZhNGkV6xdcsxRZv17gWUhfpEjnvQY2pNB/dgX+5FlEfvjfnnHfeHJ5jKg5wrUPJOM72Ghh9i7+LtQWRVsDXFeTwYdvDln/XZned/UtpTt7MDwaOci2iNvweOS8BtsmlcpsD170VHLXi3k87b1ie9u/pKb7hyGgsfqhrEbXh38hZEOkMfA90TP
y3gYpf8rrPnNZh+O6lOW06OdGmZBIf5QcDviyR+TlyhqlmTACB3G7lSw8eXfhf9ls37V0xlRWpl6ZkEPtHY/HjXYuoCX9GzoLI5sAioFV9m5aT9+3M9kcX/dhqJ19X7hVf8zXQNz8Y8NWN3q+R81waYEyAPMp3HLT21X1GFt4fa1++8sck61Iykz6A78a+9V/kLIi0AH4EtmrsrgbKlrTs/f577UL7bMhp1a75xSkZzKf5wcC+rkUk4sfIOYomGBNAoGWPsoWDTiqcsH7P+KwZ+O7Oo/iYfaKx+EDXIhLxozkv3dQEBLPFnsUfDBxTeM/8rcoWzm0OUUpWsMnXXnPir2JtQaQ/8H5zJ7s6t/OstzuM3Dae275JEVnJGiqA7fKDgZ9cCwH/Rc6kjAnUsWLlgSNXPtDh4LWvTs81G9YnIw8lI8gFLnQtogr/RM6CSHdgIUl+X7MSWfJJYNBP8zfbR/vrKjWxCtg6PxhwfhP3U+S8gBS8SJ2D2Xr/+LQDTlwx4fPNNyz9Ktn5KWlHJ+AY1yLAL5GzICLYTgdbpzJbA5WFed1mTu0wYueSnIBOSa9U8Xx+MHCCaxF+iZz7kmJjAgjkdC1fftCowvta9S96a7qYig2p1qD4kqHRWLytaxF+MeexLjMXaL9TydxBJ6+4e/H2JfNiLrUovqANjq9J8I85h7kWAJBL5bYDit4InlB438edyn/53rUexSknuhbgvs5ZEOkJ+OK5UiIGype36DFrWvthe5TltOnoWo+ScsqALVyOM+SHyOm8+FATAnlbblh88ImF/63cd910fTUt+2iJ4xKdH8zpiyJtbQh07rv+k4PHrLjnh16l3852rUdJKYe5zNxtsbYg0g5Ygb1LpQVFOe0/nNLh+O5FeZ16utaiJJ2F+cHAtq4ydx05jyKNjAnQrnJtvxGrHt7i0DUvTs+rLFvnWo+SVHpHY/HerjJ3bc6hjvNvEgKtepQtGHRS4fj47vEPZuqraRnNYFcZuzbn/o7z3yRyMN32Lp414KTC8V9uWfbjF671KElhsKuM3dU5CyItgTgZMpK7AbMmt8usKR2O265YX03LJH7MDwZ6u8jYZeTclQwxJoCAdKwoHHD8ygfaD1z72vRcU17iWpPSLGwTjcV7uMjYpTn3dJh30hAIbFf61aAxK+5Z0Wf97GZ/cVxxwm4uMlVzJokcKnv0W/fOAaNXTPis64ZlX7vWo2wSfV1k6tKcezjMO2W0NiV7DVn95I5DVj3xXuvK+ArXepQmsauLTDVypgCBnM3Lfz5oVOF9LfoVTdFX09IPJ5HTTWttQWQr7ASmWUkFuQtmtTuycEHrXfZzrUVpEGvzg4EOqc7UVeTMmqhZE7lUbHtQ0eT9Tii87+OO5b8ucK1HqZf20Vg85d01XZlzF0f5+orNKuP7DVs1sccRq5+d3qKyxNdToCvslOoMXZlTH9J7CLTYasOiQScVTtiw97r33sOYStealBrpluoMXZlzC0f5+haBrruv/+igk1fc/W2P0u8/c61H+QMpHwDOVQ8dNWct5FHe59C1kyjK6fDBlI4jexTldnLSO0X5Ayk3p0ZOn9Kuck3/ESsf7jp4zaTpeaYs7lqPkj3m7OIo37RCoHWvsu8HnbRi/NrdimP6appbssac7R3lm5bkYLbaJz5jwEmF4+d1K1s0z7WeLCVrzBlwlG9a09KU7Xbkmmd3HbYyOmOziqLlrvVkGSkv7aXenAWRPBo4pbzyRwSkU8WKgcevvD8wYO3k6TmmvNS1piwh5cPpuIiczoe5zwQE2m5fOn/QySvu+WWn9Z9/6FpPFpCb6gxdmFOjZjOSQ2XP/uve7jd6xX9nd9nw87eu9WQwKTeni+ec+lggCbQ26/ceuvqJSmClay2ZiEHWwNUpzdOVOQ0gDvLOaMSWhDq71pGJCGZ1qvNMfbE2FDZo9FTSj5S/g+vqUUqRo3wVpamUpzpDNaeiNIysiZw6jYGSbqT8fVuNnIrSMFI+h6
yaU1EaxqJUZ6jFWkVpGFkTOXX8ViXdyJrI+ZWjfBWlqWRN5PzSUb6K0lSyJnKqOZV0Yi2hcJY8SgmFlwOFTvJWlMaT8qgJbudK0eippAspr2+CmlNRGsJcF5mqORWlfma4yNSlOXUUOSUdMMBMFxlr5FSUuplPKOxkdAl35gyFlwGLneWvKA3DSdQEt5ETYLLj/BWlPpzUN0HNqSj1kbXmnIKDN8wVpYEsIxT+wVXmbs0ZChfhsEyvKPXg9Np0HTlBi7aKf3nXZeZqTkWpmUrgeZcC3JszFJ6LPlJR/Mc0QuGlLgW4N6flddcCFKUaj7kW4BdzFrgWoCgJlOC4SAv+Medr6Pudin94hVB4rWsR/jBnKFwGTHQtQ1E8HnctAPxiTsv9rgUoCnYKxddciwA/mTMU/hJ437UMJet5llDYF73W/GNOy32uBShZj/NW2ir8Zs6ngF9ci1Cylrn4qDupv8wZCpcC97qWoWQtt3iTO/sCf5nTMgEocy1CyToWYEtuvsF/5rRj2j7pWoaSddxGKFzhWkQi/jOn5Ub0PU8ldSwHHnItojr+NGco/C1a91RSx02EwiWuRVTHn+a0XIeDqb6VrGMRPn2E519zhsKF2OKtoiSTiPeUwHf415yWu4CFrkUoGcv3wMOuRdSGv81p72hXuZahZCx/IRQudy2iNvxtTstTQMy1CCXjeIpQ+FXXIurC/+a0PTb+z7UMJaMoBC5xLaI+xBjf9Faqm4LIs8AJrmU0B73PvIN2bVqSm5NDXm4OH995Hp/9sIzzxr9CSVk5ebk5TDj/GIJ9evD8zHlc8/hUOrdtw0tXn0yX9pvx/bKVXBWdwtNXjHZ9KOnKaYTCvungXht5rgU0gguAgcCWroU0B+/c9Ce6dgj89v3yh9/k2jGDGbLfTrz20Tdc/vCbTPvnmdz9yod8dMe5vPD+fJ6YPoeLh/Xn6olvc8OphzlUn9a8ng7GhHQo1lYRCv8KnI6dki3jEGBtsW3RX1NcQvcu7QDIyRFKyysoLt1Ai9xc3vtiIVt2asuOW3dxqDZtWQec61pEQ0mfYm0VBZHbgctcy9gUtj3rDjq1bYMA5w7Zn3OO3o/5i37lqGuiGGOorDTMuu1sttmiI2/N/o4rH3mL7p3b8djYExj1z6d56vJRdG63mevDSEcuIRS+27WIhpKO5mwJfAjs5VhJk1myYi1bd23PL6vXccTVj3L3eSGemzmPQbv15vgBfXnmvS/43+sfM+XGMzbaL/r2Z6xcV0z/Pj257YWZdGrbhv+cM4TNWrd0cyDpxfvAQELhStdCGkr6FGursIOBjQGKXUtpKlt3bQ/AFh3bctwBuxD7ZjGPvv0ZIw/cFYBRA/sS+2bJRvsUl5TxyNuzuTDUj2sfn8qjl41kYN9ePD5tTsr1pyFFwJnpZExIR3MChMJfkaZF23hJGUVe3TJeUsabs79nt2260b1zO6bPXQjA1M9/YMfunTfa79YXZnLJsP60yMtlfVk5AuSIUFyqL+/UQyVwsnfNpBXp1Fq7MaHwfRREjgZGuJbSGJavXsdxN9jXVcsrKzl50B4cve+OtG3dkkv/9xrlFZW0bpnH/y4e/ts+SwvXEvtmMdeefAgAFw/rx/6X3UfHQGteuvpkJ8eRRlzt984GtZF+dc5ECiJdgNlAT9dSFF/yBKHwKa5FNJX0LNZWYd9cGQKsci1F8R0fA2e5FrEppLc5AULhecCxwHrXUhTfsAwY4ccXqBtD+psTIBSeAZwE+GoMGMUJpcBxhMJL6t3S52SGOQFC4ZdJo94fStI4h1D4Q9cimoPMMSdAKPwgEHYtQ3HG/xEKR12LaC7Su7W2NgoidwMXuZahpAwDXEQoPMG1kOYksyLn71wKPONahJISKrFF2YwyJmSqOW03rdNQg2Y6FcDphMIPuBaSDDLTnJDYB3e8aylKUigHxqTLu5lNITPrnNUpiFyDHQdXyQzKgNGEwpNcC0km2WFOgILIOdgomr79iR
WAEmAkofBk10KSTfaYE6AgcgTwLNDBtRSlSSzGGvMj10JSQXaZE6AgsgvwKrCdaylKo3gXGEUonDWTK2dug1BthMLzgX7ANMdKlIZzD3B4NhkTsjFyVlEQycGOh3sDoON8+JMi4FxC4aycrzV7zVlFQWQPYCKwh2spykZ8ApxEKPydayGuyL5ibXVC4TnA/sC/sL1NFPfcCRyYzcYEjZwbUxA5CHgU2Na1lCxlHraP7DTXQvyARs5EQuH3gD2BB11LyTKKsPX/vdSYv6ORszYKIkOB24BdXEvJcJ4AxhIKL3MtxG+oOeuiIJKLnQLiOqCHYzWZxjzgQkLh6a6F+BU1Z0MoiLTGvh/6d6BzPVsrdVMEjAPu8vPEtX5AzdkYCiIdgMuBvwA6WUnjWA3cC9xJKLzcsZa0QM3ZFAoiWwHXAH9GO9LXx0Lso5EHCYXXuZWSXqg5N4WCSE/s2KhnogNbV+djbIPac4TCOipiE1BzNge2K+DRwDlAiOyNpgYoAG7Thp5NR83Z3Ngi75+wRd5s6cwwD3gBO/1B2k0Y5FfUnMmiICLAYdhi71CgvVtBzc7HWEO+QCj8tWsxmYiaMxUURFoAA7EmHQL0dSuoSVQCM/ndkD851pPxqDldYBuSBnmfwcAOTvXUTAXwBfABdlbo1/URSGpRc/qBgkh34ACgD7ATsKP3t2uKFJQC84G5wBxskfUjQuF4ivJXakDN6WcKIp2wJk38dAfaAK0T/iYuS0IKxcCv9Xx+AL7W3jr+Q82ZaRREWmKNuoFQuNi1HKXpqDmbCREZDIw1xhzjWIqSIej7nIriU9ScCYhIbxH5SkQeEZFvRORxETlcRGaKyLciEvQ+74vIbBGZJSJ9akgnICIPiUjM2264i+NR0hs15x/ZAbgd2Nn7nIx9RjkWuAr4CjjIGLM3tvP7TTWk8Q9gqjEmCBwC3CoigRRoVzKIbO0DWhcLjDFzAURkHvC2McaIyFygN3a0+EdFZEdsX9IWNaRxJHCsiIz1vrcGemEfVyhKg1Bz/pHShOXKhO+V2PMVAd4xxhwnIr2peXBqAY43xmi3NqXJaLG28XQAlnjLZ9SyzRvAxSIiACKydwp0KRmGmrPx/Au4WURmU3vJI4It7s7xisaRVIlTMgd9zqkoPkUjp6L4FDWnovgUNaei+BQ1p6L4FDWnovgUNaei+BQ1p6L4FDWnovgUNaei+BQ1p6L4FDWnovgUNaei+BQ1p6L4FDWnovgUNaei+BQ1p6L4FDWnovgUNaei+BQ1p6L4lP8HaIYIvynTpPYAAAAASUVORK5CYII=", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "import warnings\n", + "warnings.simplefilter(action=\"ignore\", category=FutureWarning)\n", + "# Bar\n", + "grafBar(df1.gender,df1.university[0])\n", + "grafBar(df1.career,df1.university[0])\n", + "grafBar(df1.age,df1.university[0])\n", + "# Pie\n", + "grafPie(df1,df1.age,df1.university[0])\n", + "grafPie(df1,df1.gender,df1.university[0])\n", + "grafPie(df1,df1.inscmonth,df1.university[0])\n", + "# Box\n", + "grafBox(df1.gender,df1.age,df1.university[0])\n", + "grafBox(df1.career,df1.age,df1.university[0])\n", + "\n", + "# Location \n", + "grafLocation(df1)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ccda0263", + "metadata": {}, + "outputs": [], + "source": [ + "\n" + ] + }, + { + "cell_type": "markdown", + "id": "2e907e1c", + "metadata": {}, + "source": [ + "# Universidad Grupo B salvador\n" + ] + }, + { + "cell_type": "code", + "execution_count": 115, + "id": "f41d6e62", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAaYAAAHbCAYAAACAzT4cAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAABnHElEQVR4nO2dd5gkVdWH3x85LyAoQXDJWQHJcQmSBRQQBAVEQFDBgKifEhYERJIYQBCEBUSQjOS0ZERYguTMkvMShYVl53x/nNs7tb3d0zPd1dU1Ped9nnpmqurWPfdWV9W54dxzZGYEQRAEQVmYqtMFCIIgCIIsoZiCIAiCUhGKKQiCICgVoZiCIAiCUhGKKQiCICgVoZiCIAiCUtFQMUkaKenNIgrTHySNkGSSlh3gdatIGlnjeKH1kzRK0pg25b1rujeztCP/BrJLcX/zIt3H6u3Ofl73wyLK2F+afWfaiaSbJF3QIM0sqdy75iBv2ZTXiCauHSNp1ACvKeRdLPq3lfRDSW1fYzRNuwW0gXuB1YGnB3jdKsDBwMiq46cCl7VerCFPN97fY4Hsx/P9flyzOvBse4rTNM2+M+3k+8CEThciKCeDRjFJEjC9mb0HNGy59hczexF4Ma/8gskp+v5Kmgd4z8w+zCG7sWY2oGdtoOmLIO93pi8kzWhmHzVKZ2aPFFGeoJw0ek4GPMeU6TqOkHS+pA8kPSPp+1XplpF0taRxkv4n6VFJP6hK8zVJd0n6SNJbkq6U9IV0bqSkNyWtJeluYDywXa2ua9r/qaQ/JHnvSPqTpOnS+V2BP2XSmqSbsnKqyrWQpEskvSfpfUmXSVq0Ko1J+pGkIyS9Iel1SSdImr6f93FrSY9JGi/pNklLZ86dVylf1TUjJb0madr+yEjXzCXpjHR/P0xDKCvVSLeHpAdTeV6TdIGkYenc6pL+JemV9FveL2mnzLW7Up77uwnwiqSTJa3c3/uUF6oaykv3+wJJO0p6KtX5Kkmfb5BPzSHQGvmPlXSMpJ9IelHS25LOlTR7Js1k70wq0/k18j5a0vOSlPZnkHSUpBckfSzpv5I2q7pmrKRjJR0o6UXgvXS8z/dfNYbyJG0j6Qn59+AWYMkaZdw5vS/jUl1vrPM8fz+V+3+SLgPmrX+3J7tuWUm3p/fgUUlb1km3tqSb0zv1lqRTJM3aHxmZPGaXdKqkl5O85yWdkjm/ZPotX0hyHpb0Y0l1v9sD+G2PTO/7B+m5OVveqMteM72kP8u/p+Mk/R6Y4tszgPf5p5KOl/QG8GCfN8fM+tzwoZk3M/sjAAOeBA4AvgKclo6tkkn3DHAFsBmwAd51/2Xm/LfTNecAXwW2BI4HVsrI/RAffvgesB6wREb+spm8DHgJuBDYFPgZ8DFwdDo/N3BMSrda2pauU7/pU9kfB7YHtgEeSvnPWSXzeWAUsDGwP/Ap8PMG93MU8EaSsRPw9fQjvQDMkNJsDPQAC2WuEz5EdGwfee+ayjVL5thtwKvAd9J9vgUfklo0k+aAJO/P+If968DfgPnT+R2AX6Tfcn3gQOAT4JslvL/DgH2B+1IeD6T9Ofu6rkY+BryZZL6JP+MN80jX/TCzf1P6be8Atkr38jXgyoG8d33kPzbdp8vT77Mn8AFwYo13dtm0vzfwP2DmqufrOeCYzLHLgddT+o3wYdlPgeWr5L8CXI+/w1/v5/t/E3BBZn/FlPf5+Du8f8rDgF0z6Q5KddwgpTsT+AhYOJNmq3TdX9Kzc0T6DQwY0cc9nzE9h//F34GdUhleB0Zl0q2Jf1/+mer37XRdtj67UvUu1pB3GvAY/h6sC3wL+Gvm/AbAIfh7OwL4MfAu8H85/LanAd9McrcF/g08AkyVS
fN7vEOwX7rXF+GjH9bk+/xKumebAJv1+fz340UbSW3FdGjm2LT4x/bItD9XSrNcnTynSgW/qIFcA7aqOj7ZD5Gp9GNVN/XXuGKbM+3/MHtD+6jfXvgLkn3QP49/iP+vSuYtVXldAtzZ4H6OSteukTn2hSRzr8z9eR44JJNm/ep618h7VzIvQ3oADFg3k2bm9FudnPZnT/fpuEbPQuYhnwY4GRidOV6K+1uVfkW8J/cW/oKdA2wIqB/XjsJfsnWAnwJvA/cAUze4rpZieheYI3PsxyndjP197/rIfyzeeJsmc+x44NV67wzekPgU2CGTZvWUptIw3KD62UnHbwHOr5L/CqlRlY71+f5n7kv2Q34e/mFU5tivqVJMVXlMlZ7Fx4CDMsfvAq6qSnsKjRVTZd7r85lja6brRmWO3QrcWHXtZO8n/VNMDwH7DPC9+xXwTCu/bY28pwbmT2nWScc+gyv8X1Td78eYXDEN5H2+t7/vbivm4tdW/jGzCXgPqjI8MQ5voZwkaXtJn626dglgPuD0BjIMuKqf5bnUzHoy+xfhLaCBWqusgt/AZyYVwudJbgfWqkp7bdX+I/Teg7543czuyOT/HP7RWyXt9+D3ZudK1xt/0MeY2UP9rwqrJFk3Z2T9D28JV+qyOn6f6v4WkuaQ9EdJz+Ev7gS81br4AMqSLVO7728l33vNbB/8WdsFmAO4Bm/hNbp2VzO70MxuMbPjgB1xRffV/srPcLeZvZ3Zr8yvzN9EXrW40cw+rcr/s6oz5GtmbwCj8RZuhe2Bp82sYjG6Id7Tvl3SNJUNuAGoHjq7wczGZ/Ybvf+1WAX4l6WvWOKi6kSSlpJ0saTXgIn4s7gE6VlMZVwRuLTq0inyqlOGe9LzCICZ3Y73mCryZ8LfmfOq7sttqSxf7oecCvcD+6dhxynepTSUeoikp/Ae2gTgcGChJHMK+vnbImlTSXdIehdXLJU6V8qxHDADmfuYvkvV93Ug7/OVtcpci1YU0ztV+5/gFalUYCP8wT4NeFXSrZJWSGk/k/6+0kDG22b2ST/L83qd/X6NLWeYFx9qqeY1YM6qY+9U7U+6Bw2oLmvlWLasp+M9qfXS2PU2+L0cCPPWkZWtS39+i1H4w300/ruunMrSn7rWKlO77281M+BDfLPjz/zbfaauzdX4ENmKTVz7TtV+5Zlupi79zV/4MEs9zgU2lTRbmrPYDh9mqTAXMA+9DZHKNhJYoCqvyX7Pfrz/tZiH+u8wAOk9uDbJ/ymwNv4s/pfeezkX3gPoM68BlKH62jlS/icy+X35GB85qr43ffFDfBTgIOBxSU9K2iFz/nf4tMRf8SHDlYHD0rm+np0+f1v53Ou/cGX0bVzRrlaVb2W+qdF9HMj7XCtdTdpmlWdmjwHbpFbb2vhNvkI+6ftWStZIaViD81mqW2WV/UbKr5pXgGVqHP8c3hLMg1otyM8CD1d2zGyspOvxntJC+Af1nAHKeaWOrGxdsr9Frcn2GYAtgB+Y2UmZ4802aoq4vxUrzvXxubWv4x/rfwB7m9l9A83PzCx1XgfyTLbCeGC67AFJc+SY/8X4HMxW+PzDfEyumMbhw+1b9yOvKe5JX+9/1chGhVep/w5XWB3vMX8l5Q+AkpFO4k28J9Uor1q8Sg2Di6pr38HrO5LaPYCX+yEHADN7B5//3FfSF4GfA2dLesDcanE74E9mdlTlGkmb9yPrRr/t1/Dh/O0rPVQlo7MMr6a/n2Xy97L6Pg7kfe73u9N2zw9mNsHMRgPH4R+/2fGJspfw4ZW82KrqY/l1fIy0MvT1CUz60PbFf4AvS1qockDS/MAaeHc9Dz4raY1M/gviLfG7qtL9De8pfR+4JD3IA+E/SdY6GVkzAZvTW5d/4/ep3m8xPf6cfJzJY1Z8ojtLKe6vpM/JF/o+i0/IL4CPg89rZt9vRimlfDcBZsGHXIvgRWDWdG8qbJRX5mlo8Vq8J7w98KiZPZBJcgPeav7AzMZUbwOQU
+v9r8XdwJaZoWvwdzjLjOlv9llcAxiekfcpbviyVdW11XnVK8OXlbGYlLQmmY9xGgq/E1ii1n0xs34rpizp3u+Pv2sV5Tgjk9d1atx4plFejX7bGYEJVcOmOzE5D+KNo0n3MX1fq+9rW97ntvSYkvY/BtfSz+Dd318A/zWzcSlNpXVwNt4TMLyFe85AHvwMswLnJ3PLZXDLsRMq8vBJO4AfSRqNr3V5vEY+o1JZr5J0EN76OhhviZ3cRLlq8Sbwd0kH4ErhEJLlT1W6S/AhgxWB/xuoEDO7RtIdwD8l/RLvHf0MfzCPTmnekfQb4HC5ef2VuDLaHDe+eElurn+QpPdw671f4hP6s2XEleX+boorojOAU83syYFmIGlPfB7l+lSuFXHLxbtwS7MiuBp/Nk6TdCzea94rZxn/xIfa3sUtMrNch8/HXSfpd3hvfjZgedzQoe7z2J/3vwa/wz9y50n6Gz43/N2qNHfiw6mnSDoK7z2NxBu5WY4ALpL0F7z3sC5uCNSI0/Hf+YrUuJkR+A1TjiT8HLhBUg++APt9YEH8nfm1mT3RD1lIui2V7yH8+7cHblFXaaBeB/wgzTGNA35A38OzWRr9tj+WdDy++H0N3CJwEmb2lqS/AodI+hT//ffAG2dZRtGO97mRdQT1rfKWrUp3E8nKBm9hnIU/lOPxbuE5wIJV13wdb4GOxz+aVwBfqCW3L/lp/6f4D/A2/mOcgC/IzVq1HIV3tXuAm+rJARbGlcL7+ItwObBYVZrJrKP6KnNVmlHAmFT3J/AW0e3V9zOT/u+4hd5UfeVrdSyBcCudM9N9+Qi4GVi5xrXfwyfNP06/13nAbOncongL+n+pLD+v8VyU5f7OScZCrZkNt0i7PT2TE/CJ/D8Cw/pxbbXV3E1krM/6eodq5LUp/kH4ELcEW6pG/mPJmAHXeg7qycMbcx+mc0vUkD893mh6Cu8Rv4orzM0byG/4/te5L9slWePx1vbKTGkuvgn+If8IXwqwWZ28foj3Oj/EG1sb0cAqL133Rdy0/2N8ZGdr/H0dVZVu1XQv3sPfi0fwXuGweu9iDVlH4z2T9/EhwhuBtTPnP4crrvfw+ZmjcOWQx2/7c/y5/h/eAFusxrM1Pd4wfhf/fvwJ/85aHu9zX5vSRYMaue+mfcysumUwqEmWN88Bp5nZgZ0uTxAEQREMGpdEQ4k0pPYl3ET5M+Q3hBgEQVB6QjGVk/nwcebXge9ZZl1FEARBt9MVQ3lBEARB9xCBAoMgCIJSMeiG8uaaay4bPnx4p4sRBEEwqLjnnnveNLO5O12O/jDoFNPw4cMZM6YtAWCDIAi6luTrclAQQ3lBEARBqQjFFARBEJSKUExBEARBqWhKMUnaVh66/FZ5OF2T9PcG16whD50+Th46+QF5mOCpmyt6EARB0I00a/xwAO6Z4APcH1UtV/GTkLQVHvZ8PO5ccBwecO33eITI7ZosRxAEQdBlNDuU9xM80uFseIz5ukiaDQ9rPBF3oPhdM9sf91L8b2DbquBYQRAEwRCmKcVkZjea2ZPWP7cR2+Iers+1TDgL81DMB6TdPpVbEARBMHQowvhh/fT36hrnbsFds68hqb9xRoIgCIIupgjFtET6O0XwLPNok8/ic10LF1CWIAiCoOQU4flhWPr7bp3zleOz18sgRRTdE2DBBRfMrWBBebjhjEeaum6DXZbOuSRBM3z8xoNNXTf93MvlXJKgGxgU65jM7K9mtpKZrTT33IPC1VMQBEHQJEUopkqPaFid85Xj77S/KEEQBEHZKUIxPZ7+Ll59IoUOXwj4FHimgLIEQRAEJacIxTQ6/d2kxrl1gJmAO8zs4wLKEgRBEJScIhTTBcCbwA6SVqoclDQDcFja/UsB5QiCIAgGAU1Z5UnaGtg67c6T/q4uaVT6/00z+xmAmb0naQ9cQd0k6VzcJdGWuCn5BbiboiAIgiBo2lx8eWCXqmML07sW6TngZ5UTZnaJpHWBXwPbADMAT
wE/Bf7YTw8SQRAEwRCgKcVkZiOBkQO85nZgs2bkBUEQBEOHQbGOKQiCIBg6hGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUNOvENegAl9ywzYCv2XqDC9tQkiAIgvYRPaYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFoYpJ0uaSrpX0oqSPJD0j6XxJqxdZjiAIgqC8FKaYJP0OuBxYEbga+ANwL7AVcLukbxVVliAIgqC8FBIoUNI8wM+A14AvmtnrmXPrAaOBQ4G/F1GeIAiCoLwU1WP6QpL1n6xSAjCzG4H3gbkLKksQBEFQYopSTE8CnwCrSJore0LSOsCswPUFlSUIgiAoMYUM5ZnZOEm/AI4DHpF0CfAWsAiwJXAd8L0iyhIEQRCUm0IUE4CZHS9pLHAasEfm1FPAqOohviyS9gT2BFhwwQXbWcwgCIKgwxRplfdz4AJgFN5Tmhn4MvAMcLako+pda2Z/NbOVzGylueeOqaggCIJuphDFJGkE8DvgX2b2UzN7xsw+NLN7ga8BLwH7SVq4iPIEQRAE5aWoHtMW6e+N1SfM7EPgrlSWFQoqTxAEQVBSilJM06e/9cbhKsc/KaAsQRAEQYkpSjHdmv7uKWn+7AlJmwJrAuOBOwoqTxAEQVBSirLKuwBfp7Qh8Kiki4FXgaXwYT4BvzSztwoqTxAEQVBSilrH1CNpM+AHwA64wcNMwDjgSuCPZnZtEWUJgiAIyk2R65gmAMenLQiCIAhqEvGYgiAIglIRiikIgiAoFaGYgiAIglIRiikIgiAoFaGYgiAIglIRiikIgiAoFaGYgiAIglIRiikIgiAoFaGYgiAIglIRiikIgiAoFaGYgiAIglIRiikIgiAoFYU5cQ2CMjHz8Heauu5/Y2dv6rrbd/5ZU9eteeYxTV0XBIOZ6DEFQRAEpSIUUxAEQVAqQjEFQRAEpSIUUxAEQVAqQjEFQRAEpSIUUxAEQVAqQjEFQRAEpSIUUxAEQVAqQjEFQRAEpSIUUxAEQVAqQjEFQRAEpSIUUxAEQVAqQjEFQRAEpSIUUxAEQVAqCldMkjaQdLGkVyV9LOllSddI2qzosgRBEATlo9B4TJKOAvYHXgT+BbwJzA18GRgBXFlkeYIgCILyUZhikrQHrpTOAPY0s0+qzk9bVFmCIAiC8lLIUJ6k6YHDgeepoZQAzGxCEWUJgiAIyk1RPaav4EN2xwM9kjYHlgXGA3eZ2b8LKkcQBEFQcopSTCunv+OB+3ClNAlJtwDbmtkbBZUnCIIgKClFKabPpr/7A48AawP3AwsBxwAbAefjBhBTIGlPYE+ABRdcsK6QhTddq6nCPXPVbU1dd9cBczZ13SqHjWvquiJZ8NjhTV33/H5jcy1H0Bwz/KmnqevG7zM4VpB8eeVHmrrunruXbuq6Ty9drqnrptnqwaaum36705q67uPzd2vqurJR1FNYkfMpsKWZ3WZmH5jZg8DXcCu9dSWtXutiM/urma1kZivNPffcBRU5CIIg6ARFKaZ30t/7zGxs9oSZfQhck3ZXKag8QRAEQUkpSjE9nv6+U+f82+nvjO0vShAEQVBmilJMNwAGLC2plsyKMcSzBZUnCIIgKCmFKCYzew64DFgQ+FH2nKSNgI3x3tTVRZQnCIIgKC9FuiT6AbACcFxax3QfbpW3NTAR2N3M3i2wPEEQBEEJKUwxmdmLkr4MHARsCawDvIf3pH5rZncVVZYgCIKgvBTqxDUtoN0nbUEQBEEwBYNjNV0QBEEwZAjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFF
ARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKUExBEARBqQjFFARBEJSKjiomSd+SZGnbvZNlCYIgCMpBxxSTpAWAPwMfdKoMQRAEQfnoiGKSJOB04C3gpE6UIQiCICgnneox7QusD3wH+F+HyhAEQRCUkMIVk6SlgCOBP5jZLUXLD4IgCMpNoYpJ0jTAWcDzwK+KlB0EQRAMDqYpWN5BwArAWmb2UX8vkrQnsCfAggsu2KaiBUEQBGWgsB6TpFXxXtKxZvbvgVxrZn81s5XMbKW55567PQUMgiAISkEhiikN4Z0JPAEcWITMIAiCYHBSVI9pFmBxYClgfGZRrQEHpzSnpGPHF1SmIAiCoIQUNcf0MfC3OudWxOedbgMeBwY0zBcEQRB0F4UopmToUNPlkKSRuGI6w8xOLaI8QRAEQXkJJ65BEARBqQjFFARBEJSKjismMxtpZophvCAIggBKoJiCIAiCIEsopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUhiknSZyTtLuliSU9J+kjSu5Juk/RdSaEggyAIAgCmKUjOdsBfgFeAG4Hngc8BXwdOBTaVtJ2ZWUHlCYIgCEpKUYrpCWBL4Aoz66kclPQr4C5gG1xJXVhQeYIgCIKSUsgQmpmNNrPLskopHX8VOCntjiiiLEEQBEG5KcPczoT099OOliIIgiAoBR1VTJKmAXZOu1f3kW5PSWMkjXnjjTeKKVwQBEHQETrdYzoSWBa40syuqZfIzP5qZiuZ2Upzzz13caULgiAICqdjiknSvsB+wGPAtztVjiAIgqBcdEQxSfoh8AfgEWA9MxvXiXIEQRAE5aNwxSTpx8CfgIdwpfRq0WUIgiAIykuhiknSL4DfA/fjSun1IuUHQRAE5acwxSTpQNzY4R5gAzN7syjZQRAEweChEM8PknYBDgUmArcC+0qqTjbWzEYVUZ4gCIKgvBTlkmih9Hdq4Md10twMjCqiMEEQBEF5Kcol0UgzU4NtRBFlCYIgCMpNpxfYBkEQBMFkhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkUopiAIgqBUhGIKgiAISkWhiknS5yWdJullSR9LGivpeElzFFmOIAiCoLxMU5QgSYsAdwCfBS4FHgNWAX4EbCJpTTN7q6jyBEEQBOWkyB7TibhS2tfMtjazX5rZ+sDvgSWAwwssSxAEQVBSClFMqbe0ETAWOKHq9MHA/4BvS5q5iPIEQRAE5aWoHtN66e+1ZtaTPWFm7wO3AzMBqxVUniAIgqCkFKWYlkh/n6hz/sn0d/ECyhIEQRCUmKKMH4alv+/WOV85Pnutk5L2BPZMux9IeryJMswFvFkn/yaya14eh+cur74siq2bflbwvdy1HeL6elaKlcdZxxYqT/u2Q1xfz2ex8gr//Yp+//Tdvq77QjsK0w4Ks8prBTP7K/DXVvKQN
MbMVsqpSKWS1811C3khL+R1Vl4nKGoor9IjGlbnfOX4O+0vShAEQVBmilJMlaG3enNIi6W/9eaggiAIgiFCUYrpxvR3I0mTyZQ0K7Am8CFwZxvL0NJQYMnldXPdQl7IC3mdlVc4MrNiBEnX4GuZ9jWzP2WOHwf8BDjZzPYqpDBBEARBaSlSMVW7JHoUWBVf4/QEsEa4JAqCIAgKU0wAkhYADgU2AT4DvAJcDBxiZm8XVpAgCIKgtBSqmIIgCIKgEYNiHVMzSFoLWAFftPsucK+Z3dbRQuWIpM8zZf1e7GihgiBoK5KWBDbFjcXONbN6TgsGNV3XY5L0ZeAset0gCahU8nFgZzMbk7PMBYGdmVxR3AP83cyey1nWF4CTga/UOH0dsJeZjc1Z5mrA7kxZv9PN7I48ZSV5KwMbA/MD09dIYmbW5xL3AcortH7B4CO94/3CzJ7PQd5BwN7AMmY2Lh3bELgMmC4lGwus0o1z812lmCQtCowBZgNuA0bj81jzAusDa+EfnVXM7Ml6+QxQ5h7AH/GHpdr/yCfAj8zs5JxkzQPcjX+wxwK30Fu/tYGFgJeBlczs1ZxkHgb8H7V9qxjwOzP7VU6yBIwCvkVvgyIrt7JvZjZ1TjILq1+QL5K+DlxqZhMLkNVDbwO3L8zMWh6JkvRvYLyZrZc5djewDHAEMA/wfeAwMzuoVXmlw8y6ZgPOACYC29U5vy3wKXBGTvI2SPLewY06RuA9tRFp/50kb4Oc5J0A9AD7A1NXnZsa+Fk6/+ec5G2X8nsW2A0Yjvdghqf9Z1P9v5GTvH2SvFHAiun/43Cv879M9/MfwBcGY/2qZE+PN5S2x3vbU2w5y9sBuB54Kz2T4/Ae9g4t5rtO2mao2m+45VCnHuDF9K4tmPdvVCVrFHB6je3i9Jz04A3h03OS9wpwYmZ//iTjmMyx64EH2lnvTm0dL0DOD89LwAUN0lwIvJSTvKvTx3KROucXSeevzkne2EZ5pTKNzUlepUc2V53zcwGvAjfnJG8M8Ghmvwc4KLO/AvAx8J3BWL9MvrvhTjgn1tl6gIk5yRI+tF3Jd0Kq84SKHODsFvKv5LF41X7DLYe6/QlXsJV6XQZsQRoJKmrDHRUcnO7rAjnlOR7vDVX2v5Hu24jMsd8B7xRZ16K2bjN+mAsP2d4Xj+EPbx6sApxnZk/XOmlmT0s6H9gmJ3nzAGc3SHMP3mPLgy8BZ5pZTU/GZvZmqt/OOclbEu/1Zpn0jJrZfZIux4cwTs9BXtH1Q9ImwKnAw3jU5mOBS4C78N9tI+B84MqcRH4P2Al/Ln6BK9mJkqYG1gWOBHaQdKuZndRE/ofiQ1xvVu23HTPbR9L+eG/we8DmwGbAS5JOBU41s5cLKEcPcEj6bY/E73ervIH3kiqshyvf/2SOTUexUcgLo9sU0xvA0g3SLEl+Lvhn7Edeb6R0efAujV3XL0j98CIDZRrc+qcvPiTf5yhb9v8Bc1adfxL/eOdBJ+q3Hz6ctoaZvS/pWOB+MzsSOFIet+AkvDeQB7vhPe11zOyjykHzeZnRktYFHgIqcgeEmY3sa7/dmNl4fJhtlKRl6VXEI4EDJF2Be5W5uoDi3EF+jZj7gS1TncbjQ763ZX9DfMj5lZzklYpu07aj8R9zh1onJW0DbIWPzebBc7hRRV+sB7RspZO4DdhW0hq1TkpaFZ83ycss/mlgi2r/hhl5U+Et1Jo9xiZ4iclbic8AX65KsxiusPKg6PqBz51dZh65ucIk+Wb2Nzyi869zkrc0cHHVB20S6fglwFJ5CJN0kKRv55HXQDGzh8xsH2A+4DvAa8CWwBWSnpX0M0kzt7EIcwJ55X8UHnXhv7g18TC8dw1A6vGuiQ9/dx3dppgOxT9aZ0u6VdKhkvaWdIikm4HzgA+Aw3KSdzGwsqQTJc2ePSFpNkl/wIf7LspJ3uHp782SzpK0m6RNJX1H0hnAren8ETnJ+wf+wbpU0mLZE8nF1AX4h+8fOcm7i
8kV0VXAKpIOlLSMpB/gDYu8nP0WXT/wD1e2lTsetyLNMgZ315UH1ZaNtcgzmt0BwHI55jcgkuLZGTekmR+v239xTzNHAY9JWr4NcjfEezUP5ZGfmd2KTzlcgn9ntjWzqzJJ1sAbchfnIa90dHqSK+8NWBn3w9dD70Rs5f9HcVPxvGTNhs8V9OBDULcA/wRuxo0eeoBHgNlylLkFPhRUPcncgw8rbpmjrOmAm1Len+I9v//gPcVP0/FbgOlykrd1+o0WSvtz4r2mnqo6LjkY65dkjgX+mtl/GriiKs0pwLs5ybsryZyxzvkZ0z2+Kyd5zwIn5XW/BiB3BXwo8t30u32Ae+FePp2fBfg58BFwSxP5j66z3UKv9eZEYIui696NW8cL0LaKeYvih/iQyA+BNdskZxi+4PWDjAKsvBgnA3O0QebMwI7AMekjdgw+rj5zG2RNi6/zebKqfk+m49O2+XcchpvB/wWfvJ93MNcPuIKMlR8+PzIeWDvtL5s+rnfkJG+vVJ+78eUN06TjU+PDzHemD+peOck7DniqniLM+V7OhM+N3UVvw+VhvLdUszGIz9192ISsnjrbRLyxdCWwfrvrPFS2rlpg20kkTYuvYRqGf1geN7MJnS1VvkiahVQ/M/ug0+XJmyLqJ+mHwPH4upuXJS2NK40ZcNPnOfHhpy3MrGXLvLRo+e/AN/FhvZ6MnKmSrPPMrOa8bBPyZsV7EuOA/cwsl6GtOrLeAWbFlcMl+Lqfmxpc80vgCDMbNNMYyf1YPS8omNktxZao/XSVYpL0R+AvZvZop8vSDiT9FBhlyUVJMPhIDZg5gbfN7JN0bDV8bmYRfNjteDO7Jme538Qt9Fagt/F0H3CamZ2To5xn8CHSedOh8cDrTGlCbma2SIuyXsCH606xfno6kTQbPoqRq6uwdiBpI+D3uCVxXSwnLyhlotsUU8VtyO34MNr5lZe/G0j1G49Pyp9sZrd3uEgtIWmdZq/txlZiNyBpLP1cx2RmC7UoayrzNURtR9LO+BDgBX2k+SI+p3VmDvJWw+ev3sDf933wuevHcfdjSwH/Au4zs0NalVc2uk0xbYOvY9ggHXobH8M/xcwezyH/0fhLt4uZvZj2+4OZ2QaNkzWUvx+wJ24ybbhhxcnAWZaDl+HU2jVgQzN7Nu33h6ZavwPwP1ZL4IBbiUXXL+geMs/qhcC3zezjGmkOxj2VtNyDkXQpPge4ZBry7QFGmtmhaXj2EOCnwKpm9nCr8spGVymmCpIWwj/gu+DeEgxvbZyEr+loau4n83AuZWZPpP3+YHl2tyWNwBXw1viwyXjcGvBkM/tP3Qsb5zsWr9/66cNd2W9IM61fSSNr5L8qHkjyaXw91qv4b7gWPtR1FW5BNuBWYtH1KxOShgPfZsqhvL+b2bMdLFrLSJoet8btax6mpV5Metffws3O78StX9+sSpOnYnoduNbMvpWRf6hlFjAnp67Pmdm2rcorHZ22vmjnhq/Y3wa4ll5zztdwtyE1/dsNpg1/SfbDu/cVC6H7cUusWTpdvibqsxquZPcBpqo6NxXwI9zcd9VOl3UAdaqYog/Ul9ynOZZhv3Rfs0snKtvHwE87fZ9aqFshfgdTPgfhPZWK1ebiVWkOzkNWyutj3Eijsj8eOLoqzfHA653+DdqxdWWPqRaSVsG74RXPAj24w9ODzeyejhUsJyR9BTgNX/UO7krnDOBIGyQBBCVdB3xsZnV9GSYXM9OY2cbFlax5JN2E98q+bT78W9lviGVCHrQg/5u4f8W38fAsN9HbC10P2BfvQe1oZv9sIv+KC56LzV0s9dslj7Xei9kEN9N+GH/26/odNLNqH4wDlZUdStsZX6bxPvA188WwefeYXgAuN7O90/7zwBgz+3omzQm4F/pZW5VXOjqtGdu94Y4q/4G3tHvwHtNx9C6snABs3+lytlC/hXBPD6+k+ozHPU08nfbfY5Csr8CHlw5rkOZwclp82oeMafEhryU6fU9yq
MsYfAjqC308P+OAu5vMvxnv4nn1Yq7DjQNmzcjOeqP/bnq/18pBVnXe6+HK/iNgp3Qszx7TDfhQXmX/PFwRVu7zPHgD495OP2Pt2LrNiSsAkuYAdsXnmRbH12rcji/SPN/SHFPqRV2EO3xs2FosixVZ8uG2FT7PtCE+zPU8bnJ8qpm9niZIt8ONI45mSp9ztfJt2gGl5WCJhP9OjYwMFs1BjguTvoHH6NrLeqOEVuaxFkn7l+LxmD7NSeY6wHtmdn8e+fWDpfH4YzXNo83n2s7H55+aYTe8B1hxs/SdJvNphhXxQIF1/Q4mv32/xsOR54aZ3Sj3WXklcKakhfPMHx/NOUzSnOnZ/APwdeA+SY/gBlCz4t4suo9Oa8Y8N9yM8ix8GKvSWzgRWK6Pa34DfNLP/Psda6Z6y6l+C6byvpTJ+0rgq9SJQYPHbBnfxvrlGTvoajzqb023LrhDzgn40Exe8h6oOnZJqtP1uHHARGCPHJ/RiWQCwLV7w0cIftsgzZHAq0WVKce6jQcOz+x/CBxXleYYYFwOsibrMWWOz427sZqIr9fK612YDTcEmjVz7Gu4L76PcNdde3b6N2jX1m09ppvT34fx3tGZ1ngF/0tp6w+FxZqpw7N4r+ItfDz9L9bYoupt3HKvPxTZ2q3Fr/G1G5cmp7u34B/Wz+FDsuvgL2Wenrevq+ykxZebkTwhpMWw9+P35ZScZL6J16EorgU2xt0rTUHqWW+U0g02XsUVQ4VXcO8rWYbh7pfagpm9IQ8dcjauOHL5PpjZe0weewkzu5huddpaTac1Y54bPpe0dqfL0cb6/Rsfcpm+02VpYx3XwIM51nPCu0aOsj5i8iihGyc5W2eOHQ+8lqPMfwL/LvB+zos3aM6hap4J74GfgztxnafTv30TdSvM7yAeB21YH+crQ+e75FS3qfLIZ7BuQ8YqLxhcpPH7Feldc3Ovmd2Rs4zXgX+ax/BB0hG4o9jPWVqjIulIYF8zmyknmYvhLeET8HUpufpTrLPoew7gi7iSf57eXuiCeG/iAXy4q+VF4KkM6wL74yFf5qB2eB0zs5ZGbIr2O1gkkl7CfRyeaV24gLYRoZiCIYuk2/EP9DL0etJ438xWyKQ5B1jdzIbnJPM03IBjTVxB/BcfkqrlS+67TeTfrIses3zMnDfH5+mmxpXgC/g6rloCWzKH75TfwSKQ9DbeKDPgXrw3eI4NET+ZXamYJK2MD8vUWwne1EtfQ06hLokycufF3S71Vb/f5CCnq132SNoFOB14ETeqGA78xMz+mEnzBPCkmW2ek8yOeAspiuSNYBl8OHQwzlvVJQUh/D6Nvy0tvwuSpsM9u+yCzwFOhT+jV+DrE68ws4mtyikrXaWY0kTuKOBbeBfemDw6Z2U/r9Zho49MrvKSzEOAX8JkhiuVuk76P6f6jaX2ZO7seGsO4GVgguXosqcoxZtkHYEvKwCfwP6xpZciDSfeBvzczI7JSd4X+pvWBoEH7GokfQSca2ZtN6RJyxvuN7MH+kizLLCitb6Yd3b8WVgat/adDR9ing4PtghteBeS7M/h37Rd8Hkzw41o/oEP9d2Xp7xS0OlJrjw33JVND66cVkz/H4e7uvklHlX2H9RZbJhjOYbh64vuwSeXp84p353oNWX+Wvr/NGAH3A/ghFS/dQu414vipuo3AzPkmO8huDuWKUzSydk8vR9lmS79ltMUIa8bNnzB67EFyappwl2V5td5PC+42XkPbqEpel0UKX1fxuT9LtQpxwr4vNqrqQy5ua4q0zZogmX1k13wAH27mtm96dg7ZnanmR2Jr9beBli/nYUws3fN7HrgK7iZ8345Zb03Puy0ibnpKMBYMzvXzPbCw65/A2/NtRUzewpf8Dc/vuK9ZSTtBBwI3IovfBU+bLEjbq7dA5xLm3+/Cmb2Sfotc1lc20kk7SDpeklvSfpU0jhJ10nKJUBghhuA1XPOsxWmJh8T7i3xkOynW9IQ4F13M7sTX2awJ
PktZaiJee/oBPy9mMDkI0JdQ7cppiXx6JlZJg15pR/1cnycuO2YT1ReCeyeU5bL4YtLsx/KSUN25pO81+AWUW3HzMbj64C+mVOWpVG87ULSgv3YPp/WVOUhT5LOwocp18fv3Ru414ANgLMlnZ2HrMQvgEUkHZCG1jvN4vhavlZZAB8BqdBDZpjZzF7HPYbkregBkDRM0vck3YEvp/gZvtzhtHbI6zTdtsAWfNy3wv9wq50sT+KTiUXxHm6WmwfT4otrK3xE71xPhYdw7+JF8SnutysPlsMtj+oqXkkVxXvZQDNPc4I9wNLWG7akP61psxZNmzOM7adMJL2Ku8w6xKpCLAyA7+FDwPfgSuNmM5soaWq8N38ksIOkW83spIFmnqwMq3kYH5LdTdL9+BB6NWbNWR1Wy9taHtKjmqnx925t3GCgVSreZCq8y5TP/Wv0OolumeR6bBN8JOiruCI0vFc6CnecW+Ri7cLoNsX0EpM/GM8wpY+4xXCF1XYkzQhsjrsqyYNX6A1ZDW6O+8WqNPNRxzw3byTNhc91vZBTlu1WvLfgL/aHVftFcia+WHNd/IN9P73ripbHDUtuwp/R5YAfAFtIWsXM3mhC3m64Mlwn+xEzt+gandYcPYQ7PB2wYsJ9UtZjeNpqYUlmK/IMv2fL9yHjP8BPmpBTzQt4r6nCI8A6mjyK7lr43E/LSDoWH8L+LD5c9wQ+fHeWDZJoAa3QbYrpLiZXRFcB+0s6EG95jsCdn16eh7A+nJ5Ogz/EO+JGArlYdOG+25bN7I8G9kyOKiv12xZ3WNsykg6qc6pSv61wxVHT3U0TtFXxmtmIvvYL4re4B48jcT9vkxpJyRz5QGAPfJ7mqbR/MH6Pf9qEvKXxAJI1W9Zm9pGkS/CeVTMUHUCxIk94w/N43MFpNRPx9U15NUJvBr4hSWmO6Z94GJErJV2Gv3ur4a7Q8uAneK/sFNwJ779zyndw0Gnrizw33O7/UWChtD8n/vBmXdu8iYcrzkNePaenlSGjT/FWzrQ5ydsVb+1X6rcAUwZJGw+slmP9+trewYeZ8vr9LsCj01b2T8AneL8NzIz3Pj8Cru/0s9ZCHS8GbmyQ5kbgosz+vfhaqmbkvU+VY9MaaY4DPuj0vWmibgfjPcEiZK2IK50F0v40eGMw+z7cCsyek7zt6WLXY422rlrHVAtJw/AWaGUl+Jlm9kqfF/U/713qnOrBJ1zHmFkuXfs+yrAQbvVXqd+JZvZgTnmvW+dUpX6PWY4Wa5J2xb3BL2MejmEBvJc4RybZBGCEuSXUoEPSW8BJZlbXekvS4Xgojs+k/ROB75jZjPWu6SOvu/DhoKWsRq8pDTc/DLxpZqsMNP+hjqQv46MiY/GYVs163ggydL1iCgY37VS8Kf9p8SHJil+3WguTzXLwFJLkfYD756ubX5rg/4aZzZL2jwL2tiYilUraC1f29+Br+W42s0+T8cM6+NDiysAPrAnjhxrytsOtK79lZi/XOD8/Ps92gpld1Kq8TL5TA3NRe0E2ZvZ8XrKC9hOKKRiySJoPN3dfkr7Xg5jl57njduBL+HDrQzXOfxG4A/dosFY6dh6wkpkNOBhdMtn+O27Sb3hvt+LgdCq83ueZWS5mzslqcm4zW7GPNGOA181ssxzkLYfP161HHaVEvlaVbaEkFqOloesqBJOsxZYCPo9bek2B5RNxtSMkM9L56bt+A46YK6li1v6SuUnxQMzcPwbeaGUoI/nmu8rMftBsHgPkWPw5OQefZK7rcDRHDsXXtt0t6e+4oUrFKm8t3LR7WjwgZGWobSOaMI8H/2oBO0m6HLfQWwFXSu/iw6Snmdk5rVSoiuVobFx0N27+3BKSlsKVOHgD46u4U9zX8DmhufD5upZ7S30YAlVj1py7rDJYjJaHTk9y5bnh7u5PwCfIc4+4Sq9Bw+KZ/f5Gev0IX0N1BDBdC3XcH3/xco+Ym6lPM/WbiL9U/wBma1L++8ARBT4vbwE3deA53
QGfo6u+v5W5ux0zaYfhTkOHNylrHWD5Aus2nkyMqzppDqOfUZUb5HN2krdc2p/kogg3lvkbbum5QA6y+jICKtxdVrdv3dZjOhof334UN+d8iXxbwK20amYAFsYXOU6Fj/cPCEkjcf9cb+HWfnnX70y8Pu9W7feHGfDooTsAH9DrGHUgPIzPJRXFDFRFCS0CMzs39WC2wnsww/CF2PcBl5rZ+5m07+LePJrlRuBkCvJ2gluJLtYgzWLUXnQ7UEYAl9vkc44CMLP/SfoeHmvqN/S93qo/1AvRMTs+R7cvvpC35Xk6AEnrAO+Z2f155Dfo6LRmzHPDexL3k5N5dhvKNxU+5PBMk9e/gK9tGdbpuvRRxouAF5q8dkdc6X+xoLL+B/eE3fH71sY6vkZBTlWTvH/iowM1l2TgQ6fjgfNzkPUx8NvM/ifA76rSnAC8XEC9l0v13iqn/Cbihj4df4Y6sXWbr7yZgess56igeWE+/3I7vvK/GT4D/Mu8FV1WbsZNupvhRdxz+u2SjpG0vaR1Ja1TveVU1qOBLeWRTzuCpDmSWXy7uAkPV18Ux+Bz17dJ2lfS4pJmTn9/hK/1mZp8Fp2PA2bJ7L/JlO6/PmFK7yG5Y95ruxT4VU5ZvokruiFJV1nlSfoPvhDxW50uSzuQ9ABwjxUQ66YTZCyRKhZydR9Oyyfe1Dq4y5+Nce8B91BniMmaMCbpQ+4suC+5nYC5yVhWSVoVXzh6gPV6yG9FVltDudeRuUeSV+s3mgh838xOzUHObbh3h6+m/ctwjxlLm9nryZPGg8CHZrZsH1nlQjLr/4GZzZxDXv/EQ8aXyVN7YXSbYtoOd264gpk90eHi5E5ak/IbfLK3rQt3O0GaQ+vXA2lmh+Qgr1BFmGQOwwPOLYMPO0+HL36dOp2fCR9+O8nMWvYSrzaHcu9D7lL4vNaq+DzMO8CdwF/M7NGcZBwE/Bz4nPmc0ua49eIruLXel/HRif3M7Pg8ZDYoz8344vC5csir8AZFmegqxQQgaV88JsqJuCuXmsNeebaAi0TScfik+aH0Xb9YUNiAohVhknkUHrJgVzM7U9LBuCXZ1Jk0lwPzWR9rgQYgr2tDucsjHa8D3GDJ+3oaLjwYV4Yf4v7sDrAWPTL0sXSi4jdyD3yt2Hlm1nIYmE41KMpCNyqmg3GT6j7dtwy2l7BCcoP0e/oeN580NBSUC0lP4cPNm6b9WorpBGBbM/tcDvL6PZ9pgzCUey0yXiBet5w+cP1Y8Cp8Ocj6ZvZSTvL6w6BrUPSHrvp4Sfo/vLX0Fm4d9DIFhYAoAkm746a/n+KT2l1VvyyS1sJNqWfHe4X3mtltHS1UPnweuLBBmg/Ib8L+C3TI7LhTboLMQ3q8lnO29ZZOVNae3YWb+n+ck7yivbaXiq5STPjamWeAL5fccq1ZfobHdlrDzJ7tdGHaQXKKeRa+Jgq8JWrp3OPAzmY2pg1yi1KE7+NOVftiIdwqKw+KXsfUbzdBDKLvj5ntWrC8rui9NsugeTD6yTz45Go3KiXw1u+pXayUFsWjc86GGwiMpjdG0/q4y57r5EHznsxJZtGK8G488N+slllImynPvMBm5BQzjILNjgt2EzS6n0nNzDZoVV5QHN2mmJ7BW7yFIumruOnvUsDMZrZoOr4U/mKence4M+7poaZvvHaR/PL9gMnrVzFtXgGf9D0+JyvIA4FZge3N7PyqcyMlbQucCxyAh5tuiU4oQtws/So8wNxk3jHS83IK7pHijznJu4li1zEdgD+jK5vZg2mu5GIzOzSZb/8RV7y75iBrRIPzFYvL7ppIHwp0eoVvnhvwQ+ANYJ6C5Al3DVTxlfUBGV9ZeA/uU+AXOck7CG9pzlpQ/abDP9wT0319sap+s+Or+HMJFogr3gsapLkQdzKbh7zKb7ddnfPbpt/vjJzv68H0+lgbn/5WAj72APvnKGsxfCHqbyjAI0r1b5jqc3Bmfxo8LPmoNpZhGLAhvi7tHGDqHPIc3
Y/tetzzyeG4N/i23utu3jpegFwr40NdF+A9p11xNyEL1tpykveD9OKdml6GkVQ5ccQ9IdySk7xpUv3+g7cW26qgcLP7nqQQp6pTv2uBO3OS9zGNHYAeDnyck7xCFWFVvuvh0Wxfwb0TvIGvwVk/Zzmn4T4dJ+LGMlcBp6fj2e1vOf6GZXETNGeq889zyCvrsLWeI9fq/RPaXcdu3bptKO9Zervvf+sjXV4Tr9/Fx8/3MDOTVGvI4Encs0AeVCx+hPdk8HA7U2CWj7n4TsDtZnZoklWrfs+SQwiDxBtAI/dAS5KfYcBcwGMN0jwGbJGTvEmY2Y34XEu72TXz/zxpq4Xhz3OrlMlN0DhJVwK7A0e1mN0M+DDyUnjv8zZ6w5WsjQ9hPgLsgy+ePhLYS9IYMzu9RdlDjm5TTAPxhp0HSwAnW2pS1eF13O1MHtxKsfVbCPeY3BeVoHN5MBrYUdIOZnZu9UlJ2+CLi8/OSV7RirATFG12/DQwPLN/D/AVSZ+1XjdBW+ENmiJ4jykVYzMcCKwELGtm72WOPw+cnRZFPwTsZWYHSboXeBxXiqGYBkhXKSYr2KQTn3+YoUGa+fG5p5YxsxF55DMAxtPYmGRB8glhAO7NYiv8Rf8B3qN4BW/lj8CNEd7H4/nkQdGKsHCseLPja4GfS5rZzP6Hh4HYHLhP0mRugtpdkBRkcXO8cdgqOwEXVSmlSZjZu5IuBL6FL5h+S9JV5DeaMKToKsXUAR4BRkhSrV6TpBlw6677Ci9ZPtwPbCRpOjP7pPpk8vu2Mb3mwS1hZk9J2hDv+a6Ztqwvu8eBXSw/C7m2K8J+eAyoR17DsUVzCv47zQj8z8yukPQT3OBjG9xN0O/IwepQ0s51TlXcBO2Iu/XJw5P5fDT2mj8Bt+is8CKNG65BDQbjg18mzgL+DPxe0k+zJ9Kq9+PwB3rAQQFLwl/x3sLZkiabf5A0Oz5EMQc5BUcDMLO7gaUkrYGvexlGCgNuZrfnJSfJKkIRliZEdhGeGMzsFdzrSvbYHyT9mZzdBOEOm2vlVfn9eoC/4/M/rfIS8FVJ/2dmU3hbkTQtsCVubFFhbloYTZBPIG+LN/7mp/bvZtaFa7S6zldekaQX/QpgI7yl/T5unnsxsBqulC41s691rJAtkpxJ7oq3Bt/GX7b78Ane6XHLo306VsCcKEIRdor+emIYbD205DeyFhU3QWMsJy/86o0efTOu6P5tZj1pnd8aeK96beA3ZjYyXfMI8EozikPS9MCVeM+9shYra+k0aY2WdaGvvFBMLSJpGvxB/SGTGwG8A/wJf1AHtT87SbsCPwK+SO/L8TBwXFgclZu0aPeutDuaPjwxWM5xviStTW/o+IqyvzVPGUUhaTp8jdJmuFLoodfwZyr8vbga2NrMPkkePI4DLjSzC5qQdxC+POM3+KLsN9P+X3FldSQ+hP5tc9+AXUUoppxI3e7F8Siz7wKPddsDkyaT5wDeTRPbreZ3UJOXmpn9plX5nSR9uDag7yGaluso6Wx8bifriWGkTemJYRUze6FVeUnmmvjaqEUrh+gdcnsS2M3McpmXLBpJ38a9jiyPK9z38BGEM83szBzlPIiv11sp7U/63dL+wvgc8CFmdmxecstCKKagYwzAtX81TQ1fJEVo+PDjuAEoxlwVoaRD8HnH7NBZ9uOd2xCNpJfwYadt034P/jE7JO1PAzwA3JWHVWvyPXgrPul/M+4S6VXcoGQ9PH7SR8DalkOE3m5F0ofAKWb2o7Q/ETjCzA7MpDkHN19frkPFbBuDakw56DrWK1jeSPzj/098GGZkP68zfEilZSTthK+JGY17QLgQn8S/Fh+i+S5wPu4RPA/mwnspFT4FZqrsmNmnkm4E8poHPRz/rmxlZpdVnTtE0la495LDgU1bEdRPi0fDezWP4kNxf7b8QlO0kwn4co0K7zPlesjncIOLriMU0wAYgDfjagaF5YykZ5q81MxskSYuurlJec1SUYTPV+0Xy
d64GfEmSSkAjE3rqM6VdDFuUHNOTvKK9sSwBr7ep1opAWBml6Y65uEN5Ra83F/CXQC9QK83hgWAqfHe4DT4XNdqwDclrZvHUHSbeREf5q3wBLB6VZoV8N+36+g6xdRmb9gj6hyvtpipPp7reGkbvZlPxZRlnY7etRkVZ6Nz4S899Pp6Kz3VirADihHcf+M5VQYxk4bszOwaSdfgUZhrftwHSNGeGHqApxqkeRK3ZG2VbwK3466Cfpk1d5eHQj8SWBVfBvA/3Bjhu8DP8XVVdUm9sR5gaTN7YgDr0fKybrwdd0Rb4RLgMEmn4la/I9L5f+Qgq3R0lWJKljNX4T/aOLz7m20tPgvshrui6fPBrIWZTVVD3nnAsvhQz01MPp7+a9xNyTcGKqsWycBiFL66HHysPhtC/m3gCFwZ/m6g+ZvZ8Cp5s+Eek58D/g+4zcwmJjP5tYHf4spsQ3IkfVR2pipwH3BWBzwZ5M20eITlCh8xZW/lIWCvnOQV7YlhDN6D6Ysv0Wsp2Aq/A8aZ2Y7VJ5KS2lHSGNyJ7C6S9sKf221o/P5X1p99WLVfFP8AFpA03MzGAsfjDYjdgO/g7/hTDN41kn1jJfAkm9dG8d6wf4N3uWevc35OfGHeoTnJK9qb+Z/wIYTp6pyfAW/9/jHH33AP/GNdy4vzeOB7nX7OWqzf08Bpmf1HgdFVac4C3spJ3rzA9sBcmWM/whtuPbi7rCOAqXKSt1r6nfauc/4H6fddNQdZr5HxZF4nzW+B1zL7f8U9UnT8WWiivtPgSvUX6TedqdNlatfWVT0miveGvRO+TuGdWifNLb8uIPnPykFe0d7Mv4YPO9UcqjOz8ZIuBXYA9m1VmKQN8Bb9+8DRTBm4b1/gBElPmdkNTeRfBvdA9+E97AqjgT2TGfJFeG9/W3wop2WsWE8M4EN0o4E/S/oxbqFXmfdZC1+AfjWwsaTsc2o2cMvHWfEgj30xLKWrMGjnZMyHfy/sdDmKoNsUU9HesOej8fxKtf+sVijam/lnaBwxd9qULg/2x5XSl83s6czxx4GbJJ2Bz5HsTwr7MUBqDcfMgS8c7sEnzytDsQvgve4H8CHSvLgcOFHSQmb2LD4Psj0+RDsqpZlAPm506mK+xu61NmQ9MvP/YmmrZlOmtMhrxvLxMWB7SYeb2cvVJyV9Hr+3j2YOL8DkQ6lBCek2xVS0N+wXga0k/bpWryK5FdkKH87Lg0K9mePDTttKOtjM3q0+KWkOvHXfrDVfNasA51UppUmY2dOSzseHMwaMVXlnT4tc78B7KvsnRVE5txDu/HMFYJNm5NUpwyh6FRBm9oKklfE5nkWAscCJZvZgXjILpkhLx2PxYc97Jf0J72Vme2f74N+D42DSmq0N8V5cqcg4pL3YzN7vw0HtFFiOC3vLQrcppvsp0Bs2Hpr7EGC0pF/hw4gV44C18LUaC9OEoUUdivZmfhLuGeAuSYfjPY7Ki78uPqc3D17PPJiRxrGP3mByg49W+B3wtqXFp1nM7FlJ2+JGF7/DV/u3haQQf9iOvPu5xKGH3rU+F5vZmGblWYGWjmZ2tqT5cT91h1adFt6Q+7WZVcKWzI4Pqf+nqDIOgFF4r/FOfNSgst8XFYvfUEwlp2hv2EfiVk1b4v7GeiRV+8/6V0qXB4V6MzezP0taDG951vKJJ+BPZnZiHvJw67/1G6RZj951SK2yMe46pyZpHu8a3ApqsDIi/W20pAFga+CXkk4ysx+0v2itY2ZHpV70TkzpJugfZvZMJu2b5LdwOW92w3+LV9L+YH7mWqfT1hd5b/iHpgcPQ/4qbt01BrcE6sE/pHnL3BG4Dm/tT0h/rwW+mbOcqfGJ4x58ePCxVL8L8GHFHrzFm3f9Vsfj7IzBjSvG4I2ANXKW89tUnxOpsnTEJ7n/kM73aYk1AHkf4sNmfaX5C/Bhu57Xdm/4OrSL8N7QjvhQ9vTp707p+IV4g+Yr+BzeROA7nS57bEN360pfed3sDbubv
ZmndVP/xhcOv49bIFYC930JV06PAatZnUiiA5R3D774dHmr4cBU0hfwlvczlpxpDjYk/QYfhqwOCV45PwxfN3W6eUjwz+DGJo+b2Zr9yL8Mlo5Bl9GViqlC3t6wy0S3ejNPH8qj8Nb8TJlTH+LDtL80s1ys5CTtgC9kHIfPpVXPoe2DPz87mtk/6+VTZpKbqX+Z2Y/7SHM8sKWZLZz2zwK+amaz9yP/m2hy4amZ5WYokSzw6nlqx8xuyUtW0H66usViZh/hQ3hdh3mL4vFOlyNvzK3/vifph7h5fCWWz+Nm1ii09UBlnZss845kSgMV4cOyPxusSinR1pDgVmXpWDSSNgJ+DyzZIOmAPLUn7yNNYTlEAk5lWBdfGrEK3kCaqkayrux5dnWPKQj6Qxqy+xaTB7W7F/c5OKhdIEl6Glc8y9Ya4pWHBH8ImMaSI97kj20LM5un0MIOEEmr4b3cN/B51n1wzyeP466HlsKNj+6zFOZjAHl3dIhS0ua4f7ypcWOfF3Arw1oCO+GMuK0Mak1btDfsoul2b+bVSFoEd7h5hZlNsQhS0lx4ULvbLGNt1SpJ+eRl8l42zsJNpK+TVC8k+KJMvrh1DXxOtmlUTCDE/8PXLq5sZi9L2ge40TwIovClHD/FlzUMlDMp1jdeNSPxBsXmZnZtB8vREQZ1j0nSWJr0hm1mCxVRxlZQ/UB6Db2ZWw5B5opG0im4yfJ8tYbtUuv+JdwN1N4FF29QooJDgieZhQRClPQ6cK2ZfSvt9+B+KUdm0twNPGc11qqVGUkfAedazuHuBwu1xiwHDWY23MwWqmy45dZL+CK19YAZzGxefLx8fXxh3Yu4tV7pMbOpshtej3/h/v6+g7tgmjH93Q33wHAp/ZwfKCEjgOvrzSWl49fReK1TkDCzT8xsC9wy70Z8mHJOfK3PjcCuZraZpQXpZvaKmX2zBaVUCYR4K+4VRPhC9B3xJQc9eJiKPH7DYUy+pu0TYOaqNLfjUXMHGx8wiP36tcqgHsqrweH46u5lLeP5IVmr3SRpPeDBlK5lp6Md4EBgJbx+72SOPweMkvQvvH4Hko/T2KKZH58r6Ivn6dKone3EzM7Ch/XaTZGBEF/HjQKy+9VD9NOSn6cQACQtic9fzZLuazu4gSkDAw4ZBnWPqQZfAy61Prxh4z2Kr7dDuKRpJC0naRVJn22DiIbezPEP+7dqnW+GVKfFJa0qaeVkKNAuPqGxt+hZ6ezYf9A3ywFXWh+BEIFKIMRWeYLJFdGdeBDExQEkzYP7VXyyxrUDRtLyKb7Tw/h7Nipzbl1JH8qDeObBL4BFJB2Q5suGFN2mmNruDVvSopI2Sy6AKsck6SB8Put+fJHoK5KuSxP6eVGYN3NJW0u6Ho/8+SjuX/BO4BlJr0n6fXrx8+QhYPM0l1SrTNMBW+A+A4Ny0t9AiI2CCfaHq4F1JVUWmv8B7x3dl+aWHsM97R/fqqCk7G7ClzD8AQ9ImuUWfOgtr7msg3EFeAjwtKSLJJ1WY/tbTvLKRVEuJorY8Af+RWBYnfNz4HNQD7cg41zcE0D22J9xQ4tP8dbZXXiohB7gZWCenOr3FH0H7ps+yX+qBRmVKLm1AvWNxYcKx6f9N4C1cvz99kr5Xlx9z3DvD5ekcn2/089aWbd0/yY2sX2ak/zCAiHivetVgVkzx76WvgMfJdl75lSvs/FF3kun/YOZMkjn+cAjOf6O/dkm5iGvbFu3zTEV4Q17ZTJu81OPaG9caWxnZg+k49Ph8zy/oteFUKsU4c18Tzys+eX4XNUzKc9DcVPujfA5rW/iwfwuk7SM1YiH0wR/xYdZt8KHZB7AGxLz4wYrM+Gh3vNywtuNFB0CvJrCAiGau1j6T9Wxi/GGTd5sAFxkZn311l/A/Q3mQemthttKpzVj3hveza7XauwB/tBi/h8CR2T290h5r1cn/S345G8edZsW7zVU6jcBV7wTMvW7BF8s2ayMu+ldcJk9Pk06fmHm2PL40
GKeodWnxUN9V3qclW0cvuZm2jY8M3PjvbU/AKdWHV8FmLFTz/Ng24Bd0zuyUNpfAB/izr6H43F/h63KOg34SUH1+hg4MrNfq8f0ewaxw98ybd02x4SZ/Qhv2Z9GcsCZ/v4NH3b6UYsixjO5OXZlvqpejJf/4L20ljGzCWa2NW7cMJpe0993cSuencxsa2vNietSwHXVeaT968kEgjOz+3ELq81akDcZqY6/wu/rsnhPcFlgLjM7wHJ2S5TCo4wFTsA9B2TXjXwOny/cMU+Z3YyZjTKzmSwFXTR3jrsy7qX9WrxXvLKZ3ZmDuB2BdhgZ1eI1fCFyXyyD95qCFum2oTwAzOzf+AelHTyIDwtWeDH9nZ/a1j/z44ojN8zsH7jz0XZgTO48NcsMTLlG6lFyjPA6qRBmPbTZyEHSV/AP5QN4C3hjvOdUKcNDkh7GF/0O6knmgjwx1MTaFwhxLMUpptHANyUtYWZT+KiURyHeAG/g5EZyu7Q77i5rdvxbcg/uDT6vgKflo9NdtsG24Q9JD7B72p8NNwL4J8mTRibtyngP67xOl3sA9bsT944xR9XxOdLx/1Yd/xMwrtPlbrKu1+MNi9nSfq3hmb8DT3e6rC3W8xB8KKp6WHuy/ztdzibqdRBuXDRHAbKWwC1UX8PnlE9O926ZtP8qHnpmwRxlHpb5faYweiAzpdBtW8cLMNg23MT+hvRgnA18FR8CmoC3vA/H12ickZTSR8BynS73AOq3R3rwn8R7D5VexBOpzvtXpb8RuLvT5W6yru8AJ2X2aymmI4H/dbqsLdRxp/R7Xo9brPXgw9w74EYkE/De97qdLmsTdZsW94RyP76M4HNtlrcJPvdZrdwrc6Dr5yhru5Tvs7hXl+F4T3d42n82yf5Gp3+HttzrThdgMG6425Oza7Q6q/dfBDbsdHmbqF913Sr1uRKYOpNuVryHtV+ny9xkPT8Ejs3s11JMJwHvdbqsLdTxNtxbxjRpvwc4KHN+Y3yZw1c7XdYm6lar99c2U/gkc3Y8COk5+JzZ+cB+wJw51+0WfIRirjrn58J7aTd3+ndox9aVc0ztxjzo4E6SjsFbpCvhY91T4a3wx/EW6oVm9mGnytksZraTpAvwuZV5cKuqK3Cnkj2ZdO8Dq3WkkPkwFvhygzSrMrjjXi0HnGN9eGKQVPHEcFnRhWuRWynYNN7c68of0tZOvgScaWZv1inHm5LOx5d2dB2hmFrAzO7DLf66DmvfepAycSnwc0nbmdn51SclfQdfP9VM2ISy0F9PDHsxyLAOBylsM9PgPfq++JAu/YZ3ZaWCoJ8chc+1nCNpW9IHO0XPXRtf7PskbuAxWHmFyV1UPc+U3vXno04QuqGKpKY9kls+YdyfBraQ9H/ZUYoKKZ7WZild1xGKKRiymNnbKXz1mfhkc4U/pr+3AjumodvBSmGeGLqMm2h+mDCPWGj/wBeaXyrpp2Y2aSlK8jZzNLA0g7s3X5dBHSiwFskB6ML4JCX4nM8zlvPCzAGU52jg6zYIIuaWBUnT46b29dbcYGZn5izzi3iYgc/ga0XuNLN78pTRCSTtCpwILGNmz0paAFdW2XARE4ARls+i18JpxxotSSOZUjGtilvmPY0blbyKz8GuhXs5vwq4ywYYxr2O/Olw44p16PW5+UqSNz8+n30bblzVyLHzoKNrFJOkb+DrCdZgyp7gp3iL8C+15hLaXK7TgZ0t54iykmbE11Stg1sJPgP8fbB+XCpI2g0fYpujXhIGaYTesiBpIdySbBHcAOREM3uwo4VqkgKj5a6G96L2B07IDq+lYbV98KUFI8ysnheYgcqcFvgZbh6ebdg+jZv8H9OpBne7GfSKKT0U59AbLfND3Ma/4m1hGO4QcSb8YT0f+KYVVPFWFZOkfwAXmNlFmWML4FZ/izJ5iHUDDjCz37ZQ5I4haRPcJP1h/MU7Fvf9dxc+5LQR/vtdaWZndKaUQVlI0XLPwocnTwAuxD3jX4s/L9/Fn
5eTzezmFmVdB3xsHg24XporcLP8jVuRVSfvWfBv2btm9kHe+ZeNbphj2gefH/g37sX7FvOItZNI3rfXxVdSb4fHFvojTSBpoENIazQjJ8MOeFyZizLHzgAWw/3wnYp7nlgd+DFwmKRbzGwwzhnsh1uQrWFm70s6FrjfzI4Ejkx+7U6iSWOEFDOrGQY8FBQUQpHRcleh8XN3P+1xvURSRl2vkCp0Q4/pv7hJ7PKNxlrT3MX9wCdm9qUm5fXgPZOBRJVseighyRtpZoem/eWA/+KtxI2zSljSBsB1+HqjQed4VNJbeATi3dJ+D3ComY3MpLkJ+MjMNm0i/ymsm5h8HqG691k5FkOHJUTSu/garb3Sfg/wGzM7OJPmCjxeU9NWdimf94ArzOybfaT5J64kq83xgwHSDT2mxYA/9WcC0Mw+lvQvWmvVvI+30r7fz/S/xIeg8mJ1/KM5srpnaGY3SBpN6720TjEzPsFbYTxThlofg4+5N8N6NY79BDe7PRufQ6hMaK+He6++ghwioAZtocg1WncA20jawswurz4paUt8ecF1zWQu6Zkmy2XdaFjVDYrpIzz0Q3+ZE//gNct/gS/1d8w6WUXlSSXMxgN1zj+Ah/0YjLyKx0Cq8AruPDPLMJo0x63+zSTtjAd2W83M7q1KfoakP+OuYS4iKCNFrtH6Nf4sXCrpZqYMQroO/i1q1nx7KpozTx/IyM2goRsU03+A7SWdmDwx1EXSl/E5m1YmQu8H1pS0iJl1YnHbW42TMFgtdR5mckV0K7CDpLXN7FZJywLfSOny4CfAP2soJQDMbIyk81K6s3KSGeRHkdFy70lhUk5L+Y5g8iH9x4HvNvoG9ZH/8FbL2E10g2I6DFc0d0g6B7gG94SdtcpbHF9/sAPe2m4ltPrNuFeAz9O/VdeX4Ca5rbC1pOHp//nS34VxJVnN53HfdoORq4DjJc1nHqr9KNxY5SZJ4/DervDfPA+WwK0A++JlJl98G5SHy4ETJS1kHvPpSGB73DJvVEozATeKahnz+EdLSloDWJFkJQfca90cG6kDDHrjBwBJWwGn4B5361VI+Ad7DzO7tKiytUqdCXuoMgpIaYVH0LzXzLZsd9nyJq3bmBN4uzJnmNaPHEDvmpvjzeyanOS9CjzWl881SbcAS5jZ5/KQGbSXblqjlUXSrKRAgWb2XoeL03a6QjHBpB9uO3zSegl6J0HfxbvZo/H1QO93poTNIekLdU59aGZvVKVdATgO90p8etsLN8iR9DdgV+D3wCHZZyM9TyNxE/zTzWz3DhQxGMJImgZfYLs7vhazwrP4MpFjqrzGdw1do5iCYKBI+iy+/m04bm15P70T2svjFoHP4OuqXu9IIYO6SNoOX8v0rTT0W31+ftwP4gnZBeqDgeSS6GrcsMJwS+CKscfn8RGgW4GNutEl0VSdLkAQdIqkbFYB/obPt66D97rXSfunAKuGUiotuwOz11JKAGb2Ej5yMhh7uz/FDSyuAJYys+FmtnoyklgCj521dkrXdUSPKSgNmcXLjTAzy9VwJw2bLEnvhPZj3TpM0i1Iehm43Mz27CPNX/DovJ8vrmStI6myHGT5PsJe3I9/w5crsmxF0A1WeQNisHr7lvQ1vAX1KXC1mdVcyCdpF2AXM1u/wOLlxS3UVkyz45aVM+LryN7JW3BSQg/lnW/QVuYEGvVm38KNogYbi+KOA2oaP5lZj6SrcJdsXceQU0z4Qzq804XoL8nS7p/ANvSumfhxcrWys3mo5yzD8XHpQUcD67hZcSOFNfAV9kHwJu75pS8Wow0NmQL4BJilQZqZGbxrFvsk5pjKz3fwRYIv4qvKfw48AmwB3JYm8LueZDG3J95jbGUdWtA93A5sKWnJWiclLQVshRsJDDYeALaVNHetk5Lmwr8L/y20VAUx6HtMHfD2XTTfwVt8K1cm4SX9HvgdPvF5vaT1zWywLqrtN2n44kbcQKG/vgqD7uUYvPd8m6RDcSu2l/BAe
psCB+IL6o9pVVBairE6cLaZvZuOzYwHYdwKD7fzOzP7Q6uyEn8GzgXuknQYcCO9gQJH4Gv75gb2zUleuTCzQb3h0R0npr/93SZ2utwDqN87wKl1zu2b6nM/MEc6dvBgql8T9+Nk3Lt4x8sSW+c3YA982Gtije0TYPec5JwLvFR17I/p/XsP+DjJ3CjHuh2R+b5Vbz3AkZ2+/+3aBn2Pic57+2430+Fra6bAzP6YLNn+CFwnacNCS1YwachmO+CpTpclKAdmdoqk2/D3f1XcUOYd4E48YvWjOYlaCe+1AJO8lOxCbxDLOXHfffvigQpbxsx+laIhfBdYgV6L0fuA08zs33nIKSPdoJg67e273bwELFjvpJn9OZk6H4f7CRyMAQIBkHRanVPTAAvgXtOnxl3OBAEASfm02zrts3gDuMJKwKx4dNzxwMuSLsV9cuaGmd2JK9khRTcopvvprLfvdvMgteMITcLMjk9BEH+Lt6wGK7s2OP8YcLSFu6WgeIzJv5drpWPZBvEbTB62JWiSblBMnfD2XSRX4t7FNzezK+olMrPfJTcmh9BcXJcysFCd4z24Y9e2hJZOSn1lfNJ8+lppzGygRjZBd/E8sFpmfyvgRTPLBvibD3g7D2Hd7G6pP4Tnh5IjaU58XuVxM7upH+l3AYab2SHtLls3IGk3PLzGHPWSEKHVhzySDsQbfRfhgUa/iXu63y+T5k5ggpmtnYO8a4C5zWzFPtKMAV43s81alVc2QjEFQxZJm+A90ofxAHDH4j3qyoT2RsD5wJVmdkZnShmUAUmz4HO4q6dD9wPrWa/p+EK4Uc5vzazl+E/d7G6pP3TDUF7QJUhapx/JKua5T5rZRy2K3A93WbOGmb0v6VjgfjM7EjhS0neBk4A/tSgnGOSkYeQ1UxRlgEdscndBhq+pGpOTyG52t9SQUExBmbiJ/s+PTUzDHT8zs8eblLcicKlNHqNrkjcUM/tbCtP9a3zBZjDEMbOa/hTNbCz5zl13s7ulhoRiCsrEobgRwqbAE8Ad9MZHWgN35HolHihtRWBzYHVJK5uH1h4oM+Or6SuMx2MwZRkD7NZE3kHQCpPcLZnZY9UnM+6WLiu8ZAUQiikoE1cDvwD2Ak6xzARocmb7PXy91npmtk9ak3Ya8CvcA8BAeZXJzXtfwWPdZBmGr50KhjjpGdwW2Jj6FpxmZhvkIK4wd0tlJIwfgtIg6To8ZPxWfaT5FzC9mW2c9m8BFjQPoDZQeVcAs5jZuml/FLAD8BUzuzXNJ9wOPGxmg83HYpAjaUnBlbhRjPAhZ2WSVPZzs+CUtAdwArUbRhOB75vZqXnIKhvhXTwoE6vgC4r74gEmX09yH+7Yshmuwie050v7R+Ev/E2S3sC9iswKHNZk/kH38At8ofthuMGBgJH42qUdgRdwf3rT5SXQzE4BvoQ7ir0HX6d5D66svtStSgliKC8oFwIWbpCmOsDjp7gDzWY4GTcHfxvAzB6RtAHuuXkRfH7peDO7psn8g+5hO+BeMzsYwEf1wMxeBc6VdBduQv5jfNlBLhTkbql0RI8pKBN3AttIqulkN6072obJfYctis8VDRgzm2Bmr5nZJ5ljd5rZFma2lJltGkopSCzC5H4oDZh20o57gLiCxm61gn4QPaagTPwaD69+laTR+IegYpW3Fj6U8jHeo0HSMOArwN87UtpgKDEBt9qs8D5T+sV7DtiysBJ1MaGYgtJgZndL2hj4G7BB2rKTzE/j8XXuTvuf4E5ra4YFCYIceRG3iKvwBL1eICqsAIwrrERdTCimoFSY2S2SFsfXLVVi0LyHGzncnjUhT54fml1cS4pl1R+zVDOzeFeGNrcD2XhnlwCHSToVuBi31tsQ+EfhJetCwlw8GLJIuonaiml2fDHvjLhl3jtm1mfokaC7kTQCt8zb28zGSpoJDxy4Mr29+qfwNXYvdaqc3UIopiCogaRZgd/jPbc1zSyXcAZB95ACdG6FG+CMBS4zsw87W
qguIRRTUDokzYvPL/W1uv43BZRjKtwE+DYz+3675QVB4IRiCkqFpEOAXzL5/Gdlpf2k/4uKjyTpD8B2ZjZfw8RB15KsREf1FTBS0reA3cxs/eJK1p3EOqagNEjaCfcBdivuk0zAGfjK+lPwkBfnAkW++DNQP4hgMHQYAQxvkOYLwLptL8kQICyNgjKxN26Wu4mZfZpW1481s3Px1fUX44sYzymiMJKWxFf8P1WEvGDQMyPuiSRokVBMQZlYDjjHzLIv96QhOzO7JsVg2p8c3P1LOq3OqWmABYA1k/z96qQLhhY15z2S1/EFgc1wn3lBi4RiCsrEtHhUzgof4euYsjyEh8XIg10bnH8MONrMTs9JXjCIqLHObaSkkX1dAhzR1kINEUIxBWXiFWDezP7zwBer0sxHfsMlC9U53gO8ncJpB0OXW+hVTOvgz+PYGukm4g2qG4Cu9fhdJKGYgjJxH7BsZn80sGcKb34RPgG9LZM702waM3suj3yC7sTMRlT+T72n083s0M6VaOgQ5uJBaUgRaU8EljGzZyUtgCurrFXcBGCEmd1ZI4sgaAuSvoB7AHm302UZCoRiCkqNpIVw44NF8GGUE82sUTDB/ua9Tj+S9eC++p5MvvmCIGgzoZiCIcsAnLiCzyNcA/zMzJp2HBsMbsrilaTbCcUUDFmShdXKwKZ4GIM76I3/tAbuyPVK4FlgRTzMwThgZTN7tgNFDjpI2bySdDPh+SEYylyNe5HYC1jKzHYzs/8zs92ApYDvp/N/N7M1gd2AOYFfdarAQWcoqVeSriV6TMGQRdJ1wIdmtlUfaf4FTG9mG6f9W4AFzWx4MaUMyoCk2/BFtAsnryQ9wMiKlV4KcHkF8DUza3nx91AnekzBUGYVoJEhxQPAapn9+4B52laioKwsB1zZl1cSfA5y/6IL1o2EYgqGMgIWbpBmkar9T4GP21OcoMT01yvJlworURcTiikYytwJbCNpo1onJW0CbJPSVVgUeLWAsgXlomivJEOa8PwQDGV+jbuduSrF27mdXqu8tYD18N7RAQCShgFfAf7ekdIGnaRQryRDnTB+CIY0aZHt3+gdsjN8iA/gaWB3M7s5pZ0RnwB/zczeKbioQQcJryTFEoopGPKksAVrACvg8wbv4R+d2y1ekKAO7fRKMtQJxRQEQRCUijB+CIIgaICkZySd0OlyDBXC+CEY8oT/s6AfzA2EZ/GCiKG8YEgT/s+C/iDpTuA5M9u+02UZCsRQXjBkCf9nwQD4I/BVSdVrl4I2EEN5wVBmb+BFYJPk/wxgrJmdC5wr6WLc/9k5HSxjUA5eBK4Hbpd0MnA3vtB6iiEnM7ul4LJ1HTGUFwxZJL0LnGNme6X9HuA3ZnZwJs0VwKxm1p+ggkGXkondVVnjVvfDGcO+rRM9pmAo01//Z3sVVqKgrBxK/4NKBi0SiikYyoT/s6BfmNnITpdhKBHGD8FQppb/s7UlfVvSzJI2x40i7utI6YJgiBJzTMGQJfyfBUE5CcUUBBnC/1lQj+RTcVtgY/pejL1BoQXrQkIxBUEQNEDS9MCVeHiLygJsZZJU9mMxdg7EHFMQBEFjfoHH5zoMmAtXQiNx45gdgRfwxdjTdah8XUUopiAIgsZsB9xrZgeb2bjKQTN7NS3IXh/YAvhxh8rXVYRiCoIgaMwiTB6d1vB1cL5j9gzuJWTXYovVnYRiCoIgaMwEYHxm/33c43iW54CFCytRFxOKKQiCoDEv4pZ4FZ4AVq9KswIwjqBlQjEFQRA05nZgjcz+JcBykk6VtLmko4ENgZs6ULauI8zFgyAIGiBpBG6Zt7eZjZU0E3AjsDK9puJPAeuZ2UudKme3EIopCIKgCSRNA2wFLIovxr7MzD7saKG6hFBMQRAEQamIOaYgCIIGSBotaecGab4laXRRZepmQjEFQRA0ZgQwvEGaLwDrtr0kQ4BQTEEQBPkwIxG7KxciUGAQBEH/qDkhn7yOLwhshvvMC1okjB+CI
AhqIKmHXmUkGodWF3CEmR3Q1oINAaLHFARBUJtb6FVG6wDP42bh1UwE3gJuAE4tpGRdTvSYgiAIGpB6TyPN7NBOl2UoED2mIAiCxiwEvNPpQgwVoscUBEEQlIroMQVBEPQTSfMCG+CexqevkcTM7DfFlqr7iB5TEARBP5B0CPBLJm/QZ631hCumqYsuW7cRC2yDIAgaIGkn4EDgVmBbXAmdAewInAL0AJUQ60GLxFBeEARBY/bGgwVuYmaf+ppaxprZucC5ki7GQ6uf08Eydg3RYwqCIGjMcsCVZpZ1OTRpyM7MrgGuAfYvumDdSCimIAiCxkyLL6Kt8BEwrCrNQ8CXCitRFxOKKQiCoDGvAPNm9p8HvliVZj7CiWsuhGIKgiBozH3Aspn90cDakr4taWZJm+NGEfd1pHRdRpiLB0EQNEDSrsCJwDJm9qykBXAlNEcm2QRghJnd2YEidhWhmIIgCJpA0kLAfsAiuHPXE83swY4WqksIxRQEQRCUiphjCoIgCEpFKKYgCIIGSNpO0mhJ89U5P7+kGyR9veiydSOhmIIgCBqzOzC7mb1c66SZvYSva9q90FJ1KaGYgiAIGrMcMKZBmruZcm1T0AShmIIgCBozJ/B6gzRvAXMVUJauJxRTEARBY94EFmuQZjEiym0uhGIKgiBozO3AlpKWrHVS0lLAVnhYjKBFQjEFQRA05hg8TNBtkvaVtHhyRbS4pB/hCmnqlC5okVhgGwRB0A8k7QGcQCbcRYaJwPfN7NRiS9WdhGIKgiDoJ2nI7vvAqsDs+JzSncBfzOzRzpWsuwjFFARBEJSKmGMKgiAISkUopiAIgqBUhGIKgiAISkUopmBII+mDnPPbWtLSmf1DJW2Yp4wg6HbC+CEY0kj6wMxmyTG/UcDlZnZBXnkGwVAjekxBAMg5WtJDkh6UtH3m3C/Ssf9KOjId20PS3enYhZJmkrQGsCVwtKT7JS0iaZSkbdM1G0i6L+V1mqTp0/Gxkg6RdG86V9O7QBAMFUIxBYHzdWB54EvAhrhymVfSprirmVXN7EvAUSn9RWa2cjr2KPBdM7sD+Bewv5ktb2ZPVzKXNAMwCtjezJbDvQjsnZH/ppmtCPwF+Fkb6xkEpScUUxA4awHnmNlEM3sNuBlYGVdSp5vZhwBmNi6lX1bSrZIeBHYClmmQ/xLAs2b2RNo/A1gnc/6i9PceYHirlQmCwUwopiBojlHAD1Pv5xBghhbz+zj9nYj3poJgyBKKKQicW4HtJU0taW68N3MXcB3wHUkzAUiaM6WfFXhF0rR4j6nC++lcNY8DwyUtmva/jffKgiCoIhRTEDgXAw8A/wVGAz83s1fN7Gp83miMpPvpnf85EPgPHg7hsUw+5wL7JyOHRSoHzWw88B3g/DT81wOc1N4qBcHgJMzFgyAIglIRPaYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVIRiCoIgCEpFKKYgCIKgVPw/NRexia6v7ioAAAAASUVORK5CYII=", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "# Bar\n", + "grafBar(df2.gender,df2.university[0])\n", + "grafBar(df2.career,df2.university[0])\n", + "grafBar(df2.age,df2.university[0])\n", + "# Pie\n", + "grafPie(df2,df2.age,df2.university[0])\n", + "grafPie(df2,df2.gender,df2.university[0])\n", + "grafPie(df2,df2.inscmonth,df2.university[0])\n", + "# Box\n", + "grafBox(df2.gender,df2.age,df2.university[0])\n", + "grafBox(df2.career,df2.age,df2.university[0])\n", + "\n", + "# Location \n", + "grafLocation(df2)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 117, + "id": "3c3dc323", + "metadata": {}, + "outputs": [], + "source": [ + "dfg1=pd.get_dummies(data=dfg, columns=['career'])\n", + "dft2=pd.get_dummies(data=dft, columns=['career'])" + ] + }, + { + "cell_type": "code", + "execution_count": 118, + "id": "1131994a", + "metadata": {}, + "outputs": [], + "source": [ + "# dfg1" + ] + }, + { + "cell_type": "code", + "execution_count": 119, + "id": "4f8c71a8", + "metadata": {}, + "outputs": [], + "source": [ + "# dft2" + ] + }, + { + "cell_type": "code", + "execution_count": 120, + "id": "81f731e1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
gender_femalegender_malecareer_actuariocareer_agronomíacareer_arquitecturacareer_bioquímicacareer_ciencias veterinariascareer_contador públicocareer_diseño de imagen y sonidocareer_diseño industrial...career_licenciatura en kinesiología y fisiatríacareer_licenciatura en musicoterapiacareer_licenciatura en planificación y diseño del paisajecareer_licenciatura en producción de bioimagenescareer_licenciatura en psicologíacareer_licenciatura en relaciones del trabajocareer_licenciatura en sociologíacareer_licenciatura en terapia ocupacionalcareer_medicinacareer_técnico para bioterios
gender_female1.000000-1.0000000.023637-0.0252870.0187230.0218760.002190-0.011613-0.0250600.019797...-0.0013010.0141500.0113610.0459330.0020170.037637-0.022677-0.0206360.0025420.031490
gender_male-1.0000001.000000-0.0236370.025287-0.018723-0.021876-0.0021900.0116130.025060-0.019797...0.001301-0.014150-0.011361-0.045933-0.002017-0.0376370.0226770.020636-0.002542-0.031490
career_actuario0.023637-0.0236371.000000-0.030460-0.031423-0.031739-0.032362-0.030460-0.034463-0.036459...-0.030784-0.035899-0.035043-0.033577-0.029801-0.029130-0.033577-0.032052-0.037559-0.032052
career_agronomía-0.0252870.025287-0.0304601.000000-0.027773-0.028052-0.028602-0.026921-0.030460-0.032224...-0.027208-0.031728-0.030972-0.029676-0.026339-0.025746-0.029676-0.028328-0.033195-0.028328
career_arquitectura0.018723-0.018723-0.031423-0.0277731.000000-0.028939-0.029507-0.027773-0.031423-0.033243...-0.028069-0.032732-0.031952-0.030615-0.027173-0.026561-0.030615-0.029225-0.034246-0.029225
career_bioquímica0.021876-0.021876-0.031739-0.028052-0.0289391.000000-0.029803-0.028052-0.031739-0.033577...-0.028350-0.033061-0.032273-0.030922-0.027446-0.026827-0.030922-0.029518-0.034590-0.029518
career_ciencias veterinarias0.002190-0.002190-0.032362-0.028602-0.029507-0.0298031.000000-0.028602-0.032362-0.034236...-0.028907-0.033710-0.032907-0.031529-0.027984-0.027354-0.031529-0.030097-0.035268-0.030097
career_contador público-0.0116130.011613-0.030460-0.026921-0.027773-0.028052-0.0286021.000000-0.030460-0.032224...-0.027208-0.031728-0.030972-0.029676-0.026339-0.025746-0.029676-0.028328-0.033195-0.028328
career_diseño de imagen y sonido-0.0250600.025060-0.034463-0.030460-0.031423-0.031739-0.032362-0.0304601.000000-0.036459...-0.030784-0.035899-0.035043-0.033577-0.029801-0.029130-0.033577-0.032052-0.037559-0.032052
career_diseño industrial0.019797-0.019797-0.036459-0.032224-0.033243-0.033577-0.034236-0.032224-0.0364591.000000...-0.032567-0.037978-0.037073-0.035521-0.031527-0.030817-0.035521-0.033908-0.039734-0.033908
career_farmacia-0.0314080.031408-0.031105-0.027491-0.028361-0.028646-0.029208-0.027491-0.031105-0.032906...-0.027784-0.032401-0.031629-0.030305-0.026898-0.026292-0.030305-0.028928-0.033899-0.028928
career_ingeniería electrónica0.016237-0.016237-0.029130-0.025746-0.026561-0.026827-0.027354-0.025746-0.029130-0.030817...-0.026020-0.030343-0.029621-0.028381-0.025190-0.024622-0.028381-0.027092-0.031747-0.027092
career_ingeniería en informática-0.0160950.016095-0.034170-0.030200-0.031156-0.031469-0.032086-0.030200-0.034170-0.036149...-0.030522-0.035593-0.034745-0.033291-0.029548-0.028882-0.033291-0.031779-0.037239-0.031779
career_ingeniería mecánica0.014747-0.014747-0.033577-0.029676-0.030615-0.030922-0.031529-0.029676-0.033577-0.035521...-0.029992-0.034975-0.034142-0.032713-0.029035-0.028381-0.032713-0.031227-0.036593-0.031227
career_licenciatura en administración-0.0250600.025060-0.034463-0.030460-0.031423-0.031739-0.032362-0.030460-0.034463-0.036459...-0.030784-0.035899-0.035043-0.033577-0.029801-0.029130-0.033577-0.032052-0.037559-0.032052
career_licenciatura en artes-0.0459650.045965-0.034754-0.030717-0.031689-0.032007-0.032635-0.030717-0.034754-0.036767...-0.031044-0.036202-0.035340-0.033860-0.030053-0.029376-0.033860-0.032322-0.037876-0.032322
career_licenciatura en ciencia política0.035334-0.035334-0.035043-0.030972-0.031952-0.032273-0.032907-0.030972-0.035043-0.037073...-0.031302-0.036503-0.035633-0.034142-0.030303-0.029621-0.034142-0.032591-0.038191-0.032591
career_licenciatura en ciencia y tecnología de alimentos0.008575-0.008575-0.032974-0.029143-0.030066-0.030367-0.030963-0.029143-0.032974-0.034884...-0.029454-0.034347-0.033529-0.032126-0.028514-0.027871-0.032126-0.030667-0.035936-0.030667
career_licenciatura en ciencias ambientales0.043898-0.043898-0.029801-0.026339-0.027173-0.027446-0.027984-0.026339-0.029801-0.031527...-0.026620-0.031043-0.030303-0.029035-0.025770-0.025190-0.029035-0.027716-0.032478-0.027716
career_licenciatura en ciencias antropológicas0.005411-0.005411-0.032669-0.028874-0.029788-0.030087-0.030677-0.028874-0.032669-0.034561...-0.029181-0.034030-0.033219-0.031829-0.028250-0.027614-0.031829-0.030383-0.035604-0.030383
career_licenciatura en ciencias biológicas-0.0338850.033885-0.034754-0.030717-0.031689-0.032007-0.032635-0.030717-0.034754-0.036767...-0.031044-0.036202-0.035340-0.033860-0.030053-0.029376-0.033860-0.032322-0.037876-0.032322
career_licenciatura en ciencias de la computación-0.0241570.024157-0.031739-0.028052-0.028939-0.029230-0.029803-0.028052-0.031739-0.033577...-0.028350-0.033061-0.032273-0.030922-0.027446-0.026827-0.030922-0.029518-0.034590-0.029518
career_licenciatura en ciencias de la educación0.025774-0.025774-0.030784-0.027208-0.028069-0.028350-0.028907-0.027208-0.030784-0.032567...-0.027497-0.032066-0.031302-0.029992-0.026620-0.026020-0.029992-0.028630-0.033549-0.028630
career_licenciatura en ciencias geológicas-0.0512130.051213-0.033277-0.029411-0.030341-0.030646-0.031247-0.029411-0.033277-0.035204...-0.029724-0.034663-0.033837-0.032421-0.028775-0.028127-0.032421-0.030948-0.036266-0.030948
career_licenciatura en gestión de agroalimentos-0.0410240.041024-0.031423-0.027773-0.028652-0.028939-0.029507-0.027773-0.031423-0.033243...-0.028069-0.032732-0.031952-0.030615-0.027173-0.026561-0.030615-0.029225-0.034246-0.029225
career_licenciatura en kinesiología y fisiatría-0.0013010.001301-0.030784-0.027208-0.028069-0.028350-0.028907-0.027208-0.030784-0.032567...1.000000-0.032066-0.031302-0.029992-0.026620-0.026020-0.029992-0.028630-0.033549-0.028630
career_licenciatura en musicoterapia0.014150-0.014150-0.035899-0.031728-0.032732-0.033061-0.033710-0.031728-0.035899-0.037978...-0.0320661.000000-0.036503-0.034975-0.031043-0.030343-0.034975-0.033387-0.039123-0.033387
career_licenciatura en planificación y diseño del paisaje0.011361-0.011361-0.035043-0.030972-0.031952-0.032273-0.032907-0.030972-0.035043-0.037073...-0.031302-0.0365031.000000-0.034142-0.030303-0.029621-0.034142-0.032591-0.038191-0.032591
career_licenciatura en producción de bioimagenes0.045933-0.045933-0.033577-0.029676-0.030615-0.030922-0.031529-0.029676-0.033577-0.035521...-0.029992-0.034975-0.0341421.000000-0.029035-0.028381-0.032713-0.031227-0.036593-0.031227
career_licenciatura en psicología0.002017-0.002017-0.029801-0.026339-0.027173-0.027446-0.027984-0.026339-0.029801-0.031527...-0.026620-0.031043-0.030303-0.0290351.000000-0.025190-0.029035-0.027716-0.032478-0.027716
career_licenciatura en relaciones del trabajo0.037637-0.037637-0.029130-0.025746-0.026561-0.026827-0.027354-0.025746-0.029130-0.030817...-0.026020-0.030343-0.029621-0.028381-0.0251901.000000-0.028381-0.027092-0.031747-0.027092
career_licenciatura en sociología-0.0226770.022677-0.033577-0.029676-0.030615-0.030922-0.031529-0.029676-0.033577-0.035521...-0.029992-0.034975-0.034142-0.032713-0.029035-0.0283811.000000-0.031227-0.036593-0.031227
career_licenciatura en terapia ocupacional-0.0206360.020636-0.032052-0.028328-0.029225-0.029518-0.030097-0.028328-0.032052-0.033908...-0.028630-0.033387-0.032591-0.031227-0.027716-0.027092-0.0312271.000000-0.034931-0.029809
career_medicina0.002542-0.002542-0.037559-0.033195-0.034246-0.034590-0.035268-0.033195-0.037559-0.039734...-0.033549-0.039123-0.038191-0.036593-0.032478-0.031747-0.036593-0.0349311.000000-0.034931
career_técnico para bioterios0.031490-0.031490-0.032052-0.028328-0.029225-0.029518-0.030097-0.028328-0.032052-0.033908...-0.028630-0.033387-0.032591-0.031227-0.027716-0.027092-0.031227-0.029809-0.0349311.000000
\n", + "

35 rows × 35 columns

\n", + "
" + ], + "text/plain": [ + " gender_female \\\n", + "gender_female 1.000000 \n", + "gender_male -1.000000 \n", + "career_actuario 0.023637 \n", + "career_agronomía -0.025287 \n", + "career_arquitectura 0.018723 \n", + "career_bioquímica 0.021876 \n", + "career_ciencias veterinarias 0.002190 \n", + "career_contador público -0.011613 \n", + "career_diseño de imagen y sonido -0.025060 \n", + "career_diseño industrial 0.019797 \n", + "career_farmacia -0.031408 \n", + "career_ingeniería electrónica 0.016237 \n", + "career_ingeniería en informática -0.016095 \n", + "career_ingeniería mecánica 0.014747 \n", + "career_licenciatura en administración -0.025060 \n", + "career_licenciatura en artes -0.045965 \n", + "career_licenciatura en ciencia política 0.035334 \n", + "career_licenciatura en ciencia y tecnología de ... 0.008575 \n", + "career_licenciatura en ciencias ambientales 0.043898 \n", + "career_licenciatura en ciencias antropológicas 0.005411 \n", + "career_licenciatura en ciencias biológicas -0.033885 \n", + "career_licenciatura en ciencias de la computación -0.024157 \n", + "career_licenciatura en ciencias de la educación 0.025774 \n", + "career_licenciatura en ciencias geológicas -0.051213 \n", + "career_licenciatura en gestión de agroalimentos -0.041024 \n", + "career_licenciatura en kinesiología y fisiatría -0.001301 \n", + "career_licenciatura en musicoterapia 0.014150 \n", + "career_licenciatura en planificación y diseño d... 
0.011361 \n", + "career_licenciatura en producción de bioimagenes 0.045933 \n", + "career_licenciatura en psicología 0.002017 \n", + "career_licenciatura en relaciones del trabajo 0.037637 \n", + "career_licenciatura en sociología -0.022677 \n", + "career_licenciatura en terapia ocupacional -0.020636 \n", + "career_medicina 0.002542 \n", + "career_técnico para bioterios 0.031490 \n", + "\n", + " gender_male \\\n", + "gender_female -1.000000 \n", + "gender_male 1.000000 \n", + "career_actuario -0.023637 \n", + "career_agronomía 0.025287 \n", + "career_arquitectura -0.018723 \n", + "career_bioquímica -0.021876 \n", + "career_ciencias veterinarias -0.002190 \n", + "career_contador público 0.011613 \n", + "career_diseño de imagen y sonido 0.025060 \n", + "career_diseño industrial -0.019797 \n", + "career_farmacia 0.031408 \n", + "career_ingeniería electrónica -0.016237 \n", + "career_ingeniería en informática 0.016095 \n", + "career_ingeniería mecánica -0.014747 \n", + "career_licenciatura en administración 0.025060 \n", + "career_licenciatura en artes 0.045965 \n", + "career_licenciatura en ciencia política -0.035334 \n", + "career_licenciatura en ciencia y tecnología de ... -0.008575 \n", + "career_licenciatura en ciencias ambientales -0.043898 \n", + "career_licenciatura en ciencias antropológicas -0.005411 \n", + "career_licenciatura en ciencias biológicas 0.033885 \n", + "career_licenciatura en ciencias de la computación 0.024157 \n", + "career_licenciatura en ciencias de la educación -0.025774 \n", + "career_licenciatura en ciencias geológicas 0.051213 \n", + "career_licenciatura en gestión de agroalimentos 0.041024 \n", + "career_licenciatura en kinesiología y fisiatría 0.001301 \n", + "career_licenciatura en musicoterapia -0.014150 \n", + "career_licenciatura en planificación y diseño d... 
-0.011361 \n", + "career_licenciatura en producción de bioimagenes -0.045933 \n", + "career_licenciatura en psicología -0.002017 \n", + "career_licenciatura en relaciones del trabajo -0.037637 \n", + "career_licenciatura en sociología 0.022677 \n", + "career_licenciatura en terapia ocupacional 0.020636 \n", + "career_medicina -0.002542 \n", + "career_técnico para bioterios -0.031490 \n", + "\n", + " career_actuario \\\n", + "gender_female 0.023637 \n", + "gender_male -0.023637 \n", + "career_actuario 1.000000 \n", + "career_agronomía -0.030460 \n", + "career_arquitectura -0.031423 \n", + "career_bioquímica -0.031739 \n", + "career_ciencias veterinarias -0.032362 \n", + "career_contador público -0.030460 \n", + "career_diseño de imagen y sonido -0.034463 \n", + "career_diseño industrial -0.036459 \n", + "career_farmacia -0.031105 \n", + "career_ingeniería electrónica -0.029130 \n", + "career_ingeniería en informática -0.034170 \n", + "career_ingeniería mecánica -0.033577 \n", + "career_licenciatura en administración -0.034463 \n", + "career_licenciatura en artes -0.034754 \n", + "career_licenciatura en ciencia política -0.035043 \n", + "career_licenciatura en ciencia y tecnología de ... -0.032974 \n", + "career_licenciatura en ciencias ambientales -0.029801 \n", + "career_licenciatura en ciencias antropológicas -0.032669 \n", + "career_licenciatura en ciencias biológicas -0.034754 \n", + "career_licenciatura en ciencias de la computación -0.031739 \n", + "career_licenciatura en ciencias de la educación -0.030784 \n", + "career_licenciatura en ciencias geológicas -0.033277 \n", + "career_licenciatura en gestión de agroalimentos -0.031423 \n", + "career_licenciatura en kinesiología y fisiatría -0.030784 \n", + "career_licenciatura en musicoterapia -0.035899 \n", + "career_licenciatura en planificación y diseño d... 
-0.035043 \n", + "career_licenciatura en producción de bioimagenes -0.033577 \n", + "career_licenciatura en psicología -0.029801 \n", + "career_licenciatura en relaciones del trabajo -0.029130 \n", + "career_licenciatura en sociología -0.033577 \n", + "career_licenciatura en terapia ocupacional -0.032052 \n", + "career_medicina -0.037559 \n", + "career_técnico para bioterios -0.032052 \n", + "\n", + " career_agronomía \\\n", + "gender_female -0.025287 \n", + "gender_male 0.025287 \n", + "career_actuario -0.030460 \n", + "career_agronomía 1.000000 \n", + "career_arquitectura -0.027773 \n", + "career_bioquímica -0.028052 \n", + "career_ciencias veterinarias -0.028602 \n", + "career_contador público -0.026921 \n", + "career_diseño de imagen y sonido -0.030460 \n", + "career_diseño industrial -0.032224 \n", + "career_farmacia -0.027491 \n", + "career_ingeniería electrónica -0.025746 \n", + "career_ingeniería en informática -0.030200 \n", + "career_ingeniería mecánica -0.029676 \n", + "career_licenciatura en administración -0.030460 \n", + "career_licenciatura en artes -0.030717 \n", + "career_licenciatura en ciencia política -0.030972 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029143 \n", + "career_licenciatura en ciencias ambientales -0.026339 \n", + "career_licenciatura en ciencias antropológicas -0.028874 \n", + "career_licenciatura en ciencias biológicas -0.030717 \n", + "career_licenciatura en ciencias de la computación -0.028052 \n", + "career_licenciatura en ciencias de la educación -0.027208 \n", + "career_licenciatura en ciencias geológicas -0.029411 \n", + "career_licenciatura en gestión de agroalimentos -0.027773 \n", + "career_licenciatura en kinesiología y fisiatría -0.027208 \n", + "career_licenciatura en musicoterapia -0.031728 \n", + "career_licenciatura en planificación y diseño d... 
-0.030972 \n", + "career_licenciatura en producción de bioimagenes -0.029676 \n", + "career_licenciatura en psicología -0.026339 \n", + "career_licenciatura en relaciones del trabajo -0.025746 \n", + "career_licenciatura en sociología -0.029676 \n", + "career_licenciatura en terapia ocupacional -0.028328 \n", + "career_medicina -0.033195 \n", + "career_técnico para bioterios -0.028328 \n", + "\n", + " career_arquitectura \\\n", + "gender_female 0.018723 \n", + "gender_male -0.018723 \n", + "career_actuario -0.031423 \n", + "career_agronomía -0.027773 \n", + "career_arquitectura 1.000000 \n", + "career_bioquímica -0.028939 \n", + "career_ciencias veterinarias -0.029507 \n", + "career_contador público -0.027773 \n", + "career_diseño de imagen y sonido -0.031423 \n", + "career_diseño industrial -0.033243 \n", + "career_farmacia -0.028361 \n", + "career_ingeniería electrónica -0.026561 \n", + "career_ingeniería en informática -0.031156 \n", + "career_ingeniería mecánica -0.030615 \n", + "career_licenciatura en administración -0.031423 \n", + "career_licenciatura en artes -0.031689 \n", + "career_licenciatura en ciencia política -0.031952 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030066 \n", + "career_licenciatura en ciencias ambientales -0.027173 \n", + "career_licenciatura en ciencias antropológicas -0.029788 \n", + "career_licenciatura en ciencias biológicas -0.031689 \n", + "career_licenciatura en ciencias de la computación -0.028939 \n", + "career_licenciatura en ciencias de la educación -0.028069 \n", + "career_licenciatura en ciencias geológicas -0.030341 \n", + "career_licenciatura en gestión de agroalimentos -0.028652 \n", + "career_licenciatura en kinesiología y fisiatría -0.028069 \n", + "career_licenciatura en musicoterapia -0.032732 \n", + "career_licenciatura en planificación y diseño d... 
-0.031952 \n", + "career_licenciatura en producción de bioimagenes -0.030615 \n", + "career_licenciatura en psicología -0.027173 \n", + "career_licenciatura en relaciones del trabajo -0.026561 \n", + "career_licenciatura en sociología -0.030615 \n", + "career_licenciatura en terapia ocupacional -0.029225 \n", + "career_medicina -0.034246 \n", + "career_técnico para bioterios -0.029225 \n", + "\n", + " career_bioquímica \\\n", + "gender_female 0.021876 \n", + "gender_male -0.021876 \n", + "career_actuario -0.031739 \n", + "career_agronomía -0.028052 \n", + "career_arquitectura -0.028939 \n", + "career_bioquímica 1.000000 \n", + "career_ciencias veterinarias -0.029803 \n", + "career_contador público -0.028052 \n", + "career_diseño de imagen y sonido -0.031739 \n", + "career_diseño industrial -0.033577 \n", + "career_farmacia -0.028646 \n", + "career_ingeniería electrónica -0.026827 \n", + "career_ingeniería en informática -0.031469 \n", + "career_ingeniería mecánica -0.030922 \n", + "career_licenciatura en administración -0.031739 \n", + "career_licenciatura en artes -0.032007 \n", + "career_licenciatura en ciencia política -0.032273 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030367 \n", + "career_licenciatura en ciencias ambientales -0.027446 \n", + "career_licenciatura en ciencias antropológicas -0.030087 \n", + "career_licenciatura en ciencias biológicas -0.032007 \n", + "career_licenciatura en ciencias de la computación -0.029230 \n", + "career_licenciatura en ciencias de la educación -0.028350 \n", + "career_licenciatura en ciencias geológicas -0.030646 \n", + "career_licenciatura en gestión de agroalimentos -0.028939 \n", + "career_licenciatura en kinesiología y fisiatría -0.028350 \n", + "career_licenciatura en musicoterapia -0.033061 \n", + "career_licenciatura en planificación y diseño d... 
-0.032273 \n", + "career_licenciatura en producción de bioimagenes -0.030922 \n", + "career_licenciatura en psicología -0.027446 \n", + "career_licenciatura en relaciones del trabajo -0.026827 \n", + "career_licenciatura en sociología -0.030922 \n", + "career_licenciatura en terapia ocupacional -0.029518 \n", + "career_medicina -0.034590 \n", + "career_técnico para bioterios -0.029518 \n", + "\n", + " career_ciencias veterinarias \\\n", + "gender_female 0.002190 \n", + "gender_male -0.002190 \n", + "career_actuario -0.032362 \n", + "career_agronomía -0.028602 \n", + "career_arquitectura -0.029507 \n", + "career_bioquímica -0.029803 \n", + "career_ciencias veterinarias 1.000000 \n", + "career_contador público -0.028602 \n", + "career_diseño de imagen y sonido -0.032362 \n", + "career_diseño industrial -0.034236 \n", + "career_farmacia -0.029208 \n", + "career_ingeniería electrónica -0.027354 \n", + "career_ingeniería en informática -0.032086 \n", + "career_ingeniería mecánica -0.031529 \n", + "career_licenciatura en administración -0.032362 \n", + "career_licenciatura en artes -0.032635 \n", + "career_licenciatura en ciencia política -0.032907 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030963 \n", + "career_licenciatura en ciencias ambientales -0.027984 \n", + "career_licenciatura en ciencias antropológicas -0.030677 \n", + "career_licenciatura en ciencias biológicas -0.032635 \n", + "career_licenciatura en ciencias de la computación -0.029803 \n", + "career_licenciatura en ciencias de la educación -0.028907 \n", + "career_licenciatura en ciencias geológicas -0.031247 \n", + "career_licenciatura en gestión de agroalimentos -0.029507 \n", + "career_licenciatura en kinesiología y fisiatría -0.028907 \n", + "career_licenciatura en musicoterapia -0.033710 \n", + "career_licenciatura en planificación y diseño d... 
-0.032907 \n", + "career_licenciatura en producción de bioimagenes -0.031529 \n", + "career_licenciatura en psicología -0.027984 \n", + "career_licenciatura en relaciones del trabajo -0.027354 \n", + "career_licenciatura en sociología -0.031529 \n", + "career_licenciatura en terapia ocupacional -0.030097 \n", + "career_medicina -0.035268 \n", + "career_técnico para bioterios -0.030097 \n", + "\n", + " career_contador público \\\n", + "gender_female -0.011613 \n", + "gender_male 0.011613 \n", + "career_actuario -0.030460 \n", + "career_agronomía -0.026921 \n", + "career_arquitectura -0.027773 \n", + "career_bioquímica -0.028052 \n", + "career_ciencias veterinarias -0.028602 \n", + "career_contador público 1.000000 \n", + "career_diseño de imagen y sonido -0.030460 \n", + "career_diseño industrial -0.032224 \n", + "career_farmacia -0.027491 \n", + "career_ingeniería electrónica -0.025746 \n", + "career_ingeniería en informática -0.030200 \n", + "career_ingeniería mecánica -0.029676 \n", + "career_licenciatura en administración -0.030460 \n", + "career_licenciatura en artes -0.030717 \n", + "career_licenciatura en ciencia política -0.030972 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029143 \n", + "career_licenciatura en ciencias ambientales -0.026339 \n", + "career_licenciatura en ciencias antropológicas -0.028874 \n", + "career_licenciatura en ciencias biológicas -0.030717 \n", + "career_licenciatura en ciencias de la computación -0.028052 \n", + "career_licenciatura en ciencias de la educación -0.027208 \n", + "career_licenciatura en ciencias geológicas -0.029411 \n", + "career_licenciatura en gestión de agroalimentos -0.027773 \n", + "career_licenciatura en kinesiología y fisiatría -0.027208 \n", + "career_licenciatura en musicoterapia -0.031728 \n", + "career_licenciatura en planificación y diseño d... 
-0.030972 \n", + "career_licenciatura en producción de bioimagenes -0.029676 \n", + "career_licenciatura en psicología -0.026339 \n", + "career_licenciatura en relaciones del trabajo -0.025746 \n", + "career_licenciatura en sociología -0.029676 \n", + "career_licenciatura en terapia ocupacional -0.028328 \n", + "career_medicina -0.033195 \n", + "career_técnico para bioterios -0.028328 \n", + "\n", + " career_diseño de imagen y sonido \\\n", + "gender_female -0.025060 \n", + "gender_male 0.025060 \n", + "career_actuario -0.034463 \n", + "career_agronomía -0.030460 \n", + "career_arquitectura -0.031423 \n", + "career_bioquímica -0.031739 \n", + "career_ciencias veterinarias -0.032362 \n", + "career_contador público -0.030460 \n", + "career_diseño de imagen y sonido 1.000000 \n", + "career_diseño industrial -0.036459 \n", + "career_farmacia -0.031105 \n", + "career_ingeniería electrónica -0.029130 \n", + "career_ingeniería en informática -0.034170 \n", + "career_ingeniería mecánica -0.033577 \n", + "career_licenciatura en administración -0.034463 \n", + "career_licenciatura en artes -0.034754 \n", + "career_licenciatura en ciencia política -0.035043 \n", + "career_licenciatura en ciencia y tecnología de ... -0.032974 \n", + "career_licenciatura en ciencias ambientales -0.029801 \n", + "career_licenciatura en ciencias antropológicas -0.032669 \n", + "career_licenciatura en ciencias biológicas -0.034754 \n", + "career_licenciatura en ciencias de la computación -0.031739 \n", + "career_licenciatura en ciencias de la educación -0.030784 \n", + "career_licenciatura en ciencias geológicas -0.033277 \n", + "career_licenciatura en gestión de agroalimentos -0.031423 \n", + "career_licenciatura en kinesiología y fisiatría -0.030784 \n", + "career_licenciatura en musicoterapia -0.035899 \n", + "career_licenciatura en planificación y diseño d... 
-0.035043 \n", + "career_licenciatura en producción de bioimagenes -0.033577 \n", + "career_licenciatura en psicología -0.029801 \n", + "career_licenciatura en relaciones del trabajo -0.029130 \n", + "career_licenciatura en sociología -0.033577 \n", + "career_licenciatura en terapia ocupacional -0.032052 \n", + "career_medicina -0.037559 \n", + "career_técnico para bioterios -0.032052 \n", + "\n", + " career_diseño industrial \\\n", + "gender_female 0.019797 \n", + "gender_male -0.019797 \n", + "career_actuario -0.036459 \n", + "career_agronomía -0.032224 \n", + "career_arquitectura -0.033243 \n", + "career_bioquímica -0.033577 \n", + "career_ciencias veterinarias -0.034236 \n", + "career_contador público -0.032224 \n", + "career_diseño de imagen y sonido -0.036459 \n", + "career_diseño industrial 1.000000 \n", + "career_farmacia -0.032906 \n", + "career_ingeniería electrónica -0.030817 \n", + "career_ingeniería en informática -0.036149 \n", + "career_ingeniería mecánica -0.035521 \n", + "career_licenciatura en administración -0.036459 \n", + "career_licenciatura en artes -0.036767 \n", + "career_licenciatura en ciencia política -0.037073 \n", + "career_licenciatura en ciencia y tecnología de ... -0.034884 \n", + "career_licenciatura en ciencias ambientales -0.031527 \n", + "career_licenciatura en ciencias antropológicas -0.034561 \n", + "career_licenciatura en ciencias biológicas -0.036767 \n", + "career_licenciatura en ciencias de la computación -0.033577 \n", + "career_licenciatura en ciencias de la educación -0.032567 \n", + "career_licenciatura en ciencias geológicas -0.035204 \n", + "career_licenciatura en gestión de agroalimentos -0.033243 \n", + "career_licenciatura en kinesiología y fisiatría -0.032567 \n", + "career_licenciatura en musicoterapia -0.037978 \n", + "career_licenciatura en planificación y diseño d... 
-0.037073 \n", + "career_licenciatura en producción de bioimagenes -0.035521 \n", + "career_licenciatura en psicología -0.031527 \n", + "career_licenciatura en relaciones del trabajo -0.030817 \n", + "career_licenciatura en sociología -0.035521 \n", + "career_licenciatura en terapia ocupacional -0.033908 \n", + "career_medicina -0.039734 \n", + "career_técnico para bioterios -0.033908 \n", + "\n", + " ... \\\n", + "gender_female ... \n", + "gender_male ... \n", + "career_actuario ... \n", + "career_agronomía ... \n", + "career_arquitectura ... \n", + "career_bioquímica ... \n", + "career_ciencias veterinarias ... \n", + "career_contador público ... \n", + "career_diseño de imagen y sonido ... \n", + "career_diseño industrial ... \n", + "career_farmacia ... \n", + "career_ingeniería electrónica ... \n", + "career_ingeniería en informática ... \n", + "career_ingeniería mecánica ... \n", + "career_licenciatura en administración ... \n", + "career_licenciatura en artes ... \n", + "career_licenciatura en ciencia política ... \n", + "career_licenciatura en ciencia y tecnología de ... ... \n", + "career_licenciatura en ciencias ambientales ... \n", + "career_licenciatura en ciencias antropológicas ... \n", + "career_licenciatura en ciencias biológicas ... \n", + "career_licenciatura en ciencias de la computación ... \n", + "career_licenciatura en ciencias de la educación ... \n", + "career_licenciatura en ciencias geológicas ... \n", + "career_licenciatura en gestión de agroalimentos ... \n", + "career_licenciatura en kinesiología y fisiatría ... \n", + "career_licenciatura en musicoterapia ... \n", + "career_licenciatura en planificación y diseño d... ... \n", + "career_licenciatura en producción de bioimagenes ... \n", + "career_licenciatura en psicología ... \n", + "career_licenciatura en relaciones del trabajo ... \n", + "career_licenciatura en sociología ... \n", + "career_licenciatura en terapia ocupacional ... \n", + "career_medicina ... 
\n", + "career_técnico para bioterios ... \n", + "\n", + " career_licenciatura en kinesiología y fisiatría \\\n", + "gender_female -0.001301 \n", + "gender_male 0.001301 \n", + "career_actuario -0.030784 \n", + "career_agronomía -0.027208 \n", + "career_arquitectura -0.028069 \n", + "career_bioquímica -0.028350 \n", + "career_ciencias veterinarias -0.028907 \n", + "career_contador público -0.027208 \n", + "career_diseño de imagen y sonido -0.030784 \n", + "career_diseño industrial -0.032567 \n", + "career_farmacia -0.027784 \n", + "career_ingeniería electrónica -0.026020 \n", + "career_ingeniería en informática -0.030522 \n", + "career_ingeniería mecánica -0.029992 \n", + "career_licenciatura en administración -0.030784 \n", + "career_licenciatura en artes -0.031044 \n", + "career_licenciatura en ciencia política -0.031302 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029454 \n", + "career_licenciatura en ciencias ambientales -0.026620 \n", + "career_licenciatura en ciencias antropológicas -0.029181 \n", + "career_licenciatura en ciencias biológicas -0.031044 \n", + "career_licenciatura en ciencias de la computación -0.028350 \n", + "career_licenciatura en ciencias de la educación -0.027497 \n", + "career_licenciatura en ciencias geológicas -0.029724 \n", + "career_licenciatura en gestión de agroalimentos -0.028069 \n", + "career_licenciatura en kinesiología y fisiatría 1.000000 \n", + "career_licenciatura en musicoterapia -0.032066 \n", + "career_licenciatura en planificación y diseño d... 
-0.031302 \n", + "career_licenciatura en producción de bioimagenes -0.029992 \n", + "career_licenciatura en psicología -0.026620 \n", + "career_licenciatura en relaciones del trabajo -0.026020 \n", + "career_licenciatura en sociología -0.029992 \n", + "career_licenciatura en terapia ocupacional -0.028630 \n", + "career_medicina -0.033549 \n", + "career_técnico para bioterios -0.028630 \n", + "\n", + " career_licenciatura en musicoterapia \\\n", + "gender_female 0.014150 \n", + "gender_male -0.014150 \n", + "career_actuario -0.035899 \n", + "career_agronomía -0.031728 \n", + "career_arquitectura -0.032732 \n", + "career_bioquímica -0.033061 \n", + "career_ciencias veterinarias -0.033710 \n", + "career_contador público -0.031728 \n", + "career_diseño de imagen y sonido -0.035899 \n", + "career_diseño industrial -0.037978 \n", + "career_farmacia -0.032401 \n", + "career_ingeniería electrónica -0.030343 \n", + "career_ingeniería en informática -0.035593 \n", + "career_ingeniería mecánica -0.034975 \n", + "career_licenciatura en administración -0.035899 \n", + "career_licenciatura en artes -0.036202 \n", + "career_licenciatura en ciencia política -0.036503 \n", + "career_licenciatura en ciencia y tecnología de ... -0.034347 \n", + "career_licenciatura en ciencias ambientales -0.031043 \n", + "career_licenciatura en ciencias antropológicas -0.034030 \n", + "career_licenciatura en ciencias biológicas -0.036202 \n", + "career_licenciatura en ciencias de la computación -0.033061 \n", + "career_licenciatura en ciencias de la educación -0.032066 \n", + "career_licenciatura en ciencias geológicas -0.034663 \n", + "career_licenciatura en gestión de agroalimentos -0.032732 \n", + "career_licenciatura en kinesiología y fisiatría -0.032066 \n", + "career_licenciatura en musicoterapia 1.000000 \n", + "career_licenciatura en planificación y diseño d... 
-0.036503 \n", + "career_licenciatura en producción de bioimagenes -0.034975 \n", + "career_licenciatura en psicología -0.031043 \n", + "career_licenciatura en relaciones del trabajo -0.030343 \n", + "career_licenciatura en sociología -0.034975 \n", + "career_licenciatura en terapia ocupacional -0.033387 \n", + "career_medicina -0.039123 \n", + "career_técnico para bioterios -0.033387 \n", + "\n", + " career_licenciatura en planificación y diseño del paisaje \\\n", + "gender_female 0.011361 \n", + "gender_male -0.011361 \n", + "career_actuario -0.035043 \n", + "career_agronomía -0.030972 \n", + "career_arquitectura -0.031952 \n", + "career_bioquímica -0.032273 \n", + "career_ciencias veterinarias -0.032907 \n", + "career_contador público -0.030972 \n", + "career_diseño de imagen y sonido -0.035043 \n", + "career_diseño industrial -0.037073 \n", + "career_farmacia -0.031629 \n", + "career_ingeniería electrónica -0.029621 \n", + "career_ingeniería en informática -0.034745 \n", + "career_ingeniería mecánica -0.034142 \n", + "career_licenciatura en administración -0.035043 \n", + "career_licenciatura en artes -0.035340 \n", + "career_licenciatura en ciencia política -0.035633 \n", + "career_licenciatura en ciencia y tecnología de ... -0.033529 \n", + "career_licenciatura en ciencias ambientales -0.030303 \n", + "career_licenciatura en ciencias antropológicas -0.033219 \n", + "career_licenciatura en ciencias biológicas -0.035340 \n", + "career_licenciatura en ciencias de la computación -0.032273 \n", + "career_licenciatura en ciencias de la educación -0.031302 \n", + "career_licenciatura en ciencias geológicas -0.033837 \n", + "career_licenciatura en gestión de agroalimentos -0.031952 \n", + "career_licenciatura en kinesiología y fisiatría -0.031302 \n", + "career_licenciatura en musicoterapia -0.036503 \n", + "career_licenciatura en planificación y diseño d... 
1.000000 \n", + "career_licenciatura en producción de bioimagenes -0.034142 \n", + "career_licenciatura en psicología -0.030303 \n", + "career_licenciatura en relaciones del trabajo -0.029621 \n", + "career_licenciatura en sociología -0.034142 \n", + "career_licenciatura en terapia ocupacional -0.032591 \n", + "career_medicina -0.038191 \n", + "career_técnico para bioterios -0.032591 \n", + "\n", + " career_licenciatura en producción de bioimagenes \\\n", + "gender_female 0.045933 \n", + "gender_male -0.045933 \n", + "career_actuario -0.033577 \n", + "career_agronomía -0.029676 \n", + "career_arquitectura -0.030615 \n", + "career_bioquímica -0.030922 \n", + "career_ciencias veterinarias -0.031529 \n", + "career_contador público -0.029676 \n", + "career_diseño de imagen y sonido -0.033577 \n", + "career_diseño industrial -0.035521 \n", + "career_farmacia -0.030305 \n", + "career_ingeniería electrónica -0.028381 \n", + "career_ingeniería en informática -0.033291 \n", + "career_ingeniería mecánica -0.032713 \n", + "career_licenciatura en administración -0.033577 \n", + "career_licenciatura en artes -0.033860 \n", + "career_licenciatura en ciencia política -0.034142 \n", + "career_licenciatura en ciencia y tecnología de ... -0.032126 \n", + "career_licenciatura en ciencias ambientales -0.029035 \n", + "career_licenciatura en ciencias antropológicas -0.031829 \n", + "career_licenciatura en ciencias biológicas -0.033860 \n", + "career_licenciatura en ciencias de la computación -0.030922 \n", + "career_licenciatura en ciencias de la educación -0.029992 \n", + "career_licenciatura en ciencias geológicas -0.032421 \n", + "career_licenciatura en gestión de agroalimentos -0.030615 \n", + "career_licenciatura en kinesiología y fisiatría -0.029992 \n", + "career_licenciatura en musicoterapia -0.034975 \n", + "career_licenciatura en planificación y diseño d... 
-0.034142 \n", + "career_licenciatura en producción de bioimagenes 1.000000 \n", + "career_licenciatura en psicología -0.029035 \n", + "career_licenciatura en relaciones del trabajo -0.028381 \n", + "career_licenciatura en sociología -0.032713 \n", + "career_licenciatura en terapia ocupacional -0.031227 \n", + "career_medicina -0.036593 \n", + "career_técnico para bioterios -0.031227 \n", + "\n", + " career_licenciatura en psicología \\\n", + "gender_female 0.002017 \n", + "gender_male -0.002017 \n", + "career_actuario -0.029801 \n", + "career_agronomía -0.026339 \n", + "career_arquitectura -0.027173 \n", + "career_bioquímica -0.027446 \n", + "career_ciencias veterinarias -0.027984 \n", + "career_contador público -0.026339 \n", + "career_diseño de imagen y sonido -0.029801 \n", + "career_diseño industrial -0.031527 \n", + "career_farmacia -0.026898 \n", + "career_ingeniería electrónica -0.025190 \n", + "career_ingeniería en informática -0.029548 \n", + "career_ingeniería mecánica -0.029035 \n", + "career_licenciatura en administración -0.029801 \n", + "career_licenciatura en artes -0.030053 \n", + "career_licenciatura en ciencia política -0.030303 \n", + "career_licenciatura en ciencia y tecnología de ... -0.028514 \n", + "career_licenciatura en ciencias ambientales -0.025770 \n", + "career_licenciatura en ciencias antropológicas -0.028250 \n", + "career_licenciatura en ciencias biológicas -0.030053 \n", + "career_licenciatura en ciencias de la computación -0.027446 \n", + "career_licenciatura en ciencias de la educación -0.026620 \n", + "career_licenciatura en ciencias geológicas -0.028775 \n", + "career_licenciatura en gestión de agroalimentos -0.027173 \n", + "career_licenciatura en kinesiología y fisiatría -0.026620 \n", + "career_licenciatura en musicoterapia -0.031043 \n", + "career_licenciatura en planificación y diseño d... 
-0.030303 \n", + "career_licenciatura en producción de bioimagenes -0.029035 \n", + "career_licenciatura en psicología 1.000000 \n", + "career_licenciatura en relaciones del trabajo -0.025190 \n", + "career_licenciatura en sociología -0.029035 \n", + "career_licenciatura en terapia ocupacional -0.027716 \n", + "career_medicina -0.032478 \n", + "career_técnico para bioterios -0.027716 \n", + "\n", + " career_licenciatura en relaciones del trabajo \\\n", + "gender_female 0.037637 \n", + "gender_male -0.037637 \n", + "career_actuario -0.029130 \n", + "career_agronomía -0.025746 \n", + "career_arquitectura -0.026561 \n", + "career_bioquímica -0.026827 \n", + "career_ciencias veterinarias -0.027354 \n", + "career_contador público -0.025746 \n", + "career_diseño de imagen y sonido -0.029130 \n", + "career_diseño industrial -0.030817 \n", + "career_farmacia -0.026292 \n", + "career_ingeniería electrónica -0.024622 \n", + "career_ingeniería en informática -0.028882 \n", + "career_ingeniería mecánica -0.028381 \n", + "career_licenciatura en administración -0.029130 \n", + "career_licenciatura en artes -0.029376 \n", + "career_licenciatura en ciencia política -0.029621 \n", + "career_licenciatura en ciencia y tecnología de ... -0.027871 \n", + "career_licenciatura en ciencias ambientales -0.025190 \n", + "career_licenciatura en ciencias antropológicas -0.027614 \n", + "career_licenciatura en ciencias biológicas -0.029376 \n", + "career_licenciatura en ciencias de la computación -0.026827 \n", + "career_licenciatura en ciencias de la educación -0.026020 \n", + "career_licenciatura en ciencias geológicas -0.028127 \n", + "career_licenciatura en gestión de agroalimentos -0.026561 \n", + "career_licenciatura en kinesiología y fisiatría -0.026020 \n", + "career_licenciatura en musicoterapia -0.030343 \n", + "career_licenciatura en planificación y diseño d... 
-0.029621 \n", + "career_licenciatura en producción de bioimagenes -0.028381 \n", + "career_licenciatura en psicología -0.025190 \n", + "career_licenciatura en relaciones del trabajo 1.000000 \n", + "career_licenciatura en sociología -0.028381 \n", + "career_licenciatura en terapia ocupacional -0.027092 \n", + "career_medicina -0.031747 \n", + "career_técnico para bioterios -0.027092 \n", + "\n", + " career_licenciatura en sociología \\\n", + "gender_female -0.022677 \n", + "gender_male 0.022677 \n", + "career_actuario -0.033577 \n", + "career_agronomía -0.029676 \n", + "career_arquitectura -0.030615 \n", + "career_bioquímica -0.030922 \n", + "career_ciencias veterinarias -0.031529 \n", + "career_contador público -0.029676 \n", + "career_diseño de imagen y sonido -0.033577 \n", + "career_diseño industrial -0.035521 \n", + "career_farmacia -0.030305 \n", + "career_ingeniería electrónica -0.028381 \n", + "career_ingeniería en informática -0.033291 \n", + "career_ingeniería mecánica -0.032713 \n", + "career_licenciatura en administración -0.033577 \n", + "career_licenciatura en artes -0.033860 \n", + "career_licenciatura en ciencia política -0.034142 \n", + "career_licenciatura en ciencia y tecnología de ... -0.032126 \n", + "career_licenciatura en ciencias ambientales -0.029035 \n", + "career_licenciatura en ciencias antropológicas -0.031829 \n", + "career_licenciatura en ciencias biológicas -0.033860 \n", + "career_licenciatura en ciencias de la computación -0.030922 \n", + "career_licenciatura en ciencias de la educación -0.029992 \n", + "career_licenciatura en ciencias geológicas -0.032421 \n", + "career_licenciatura en gestión de agroalimentos -0.030615 \n", + "career_licenciatura en kinesiología y fisiatría -0.029992 \n", + "career_licenciatura en musicoterapia -0.034975 \n", + "career_licenciatura en planificación y diseño d... 
-0.034142 \n", + "career_licenciatura en producción de bioimagenes -0.032713 \n", + "career_licenciatura en psicología -0.029035 \n", + "career_licenciatura en relaciones del trabajo -0.028381 \n", + "career_licenciatura en sociología 1.000000 \n", + "career_licenciatura en terapia ocupacional -0.031227 \n", + "career_medicina -0.036593 \n", + "career_técnico para bioterios -0.031227 \n", + "\n", + " career_licenciatura en terapia ocupacional \\\n", + "gender_female -0.020636 \n", + "gender_male 0.020636 \n", + "career_actuario -0.032052 \n", + "career_agronomía -0.028328 \n", + "career_arquitectura -0.029225 \n", + "career_bioquímica -0.029518 \n", + "career_ciencias veterinarias -0.030097 \n", + "career_contador público -0.028328 \n", + "career_diseño de imagen y sonido -0.032052 \n", + "career_diseño industrial -0.033908 \n", + "career_farmacia -0.028928 \n", + "career_ingeniería electrónica -0.027092 \n", + "career_ingeniería en informática -0.031779 \n", + "career_ingeniería mecánica -0.031227 \n", + "career_licenciatura en administración -0.032052 \n", + "career_licenciatura en artes -0.032322 \n", + "career_licenciatura en ciencia política -0.032591 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030667 \n", + "career_licenciatura en ciencias ambientales -0.027716 \n", + "career_licenciatura en ciencias antropológicas -0.030383 \n", + "career_licenciatura en ciencias biológicas -0.032322 \n", + "career_licenciatura en ciencias de la computación -0.029518 \n", + "career_licenciatura en ciencias de la educación -0.028630 \n", + "career_licenciatura en ciencias geológicas -0.030948 \n", + "career_licenciatura en gestión de agroalimentos -0.029225 \n", + "career_licenciatura en kinesiología y fisiatría -0.028630 \n", + "career_licenciatura en musicoterapia -0.033387 \n", + "career_licenciatura en planificación y diseño d... 
-0.032591 \n", + "career_licenciatura en producción de bioimagenes -0.031227 \n", + "career_licenciatura en psicología -0.027716 \n", + "career_licenciatura en relaciones del trabajo -0.027092 \n", + "career_licenciatura en sociología -0.031227 \n", + "career_licenciatura en terapia ocupacional 1.000000 \n", + "career_medicina -0.034931 \n", + "career_técnico para bioterios -0.029809 \n", + "\n", + " career_medicina \\\n", + "gender_female 0.002542 \n", + "gender_male -0.002542 \n", + "career_actuario -0.037559 \n", + "career_agronomía -0.033195 \n", + "career_arquitectura -0.034246 \n", + "career_bioquímica -0.034590 \n", + "career_ciencias veterinarias -0.035268 \n", + "career_contador público -0.033195 \n", + "career_diseño de imagen y sonido -0.037559 \n", + "career_diseño industrial -0.039734 \n", + "career_farmacia -0.033899 \n", + "career_ingeniería electrónica -0.031747 \n", + "career_ingeniería en informática -0.037239 \n", + "career_ingeniería mecánica -0.036593 \n", + "career_licenciatura en administración -0.037559 \n", + "career_licenciatura en artes -0.037876 \n", + "career_licenciatura en ciencia política -0.038191 \n", + "career_licenciatura en ciencia y tecnología de ... -0.035936 \n", + "career_licenciatura en ciencias ambientales -0.032478 \n", + "career_licenciatura en ciencias antropológicas -0.035604 \n", + "career_licenciatura en ciencias biológicas -0.037876 \n", + "career_licenciatura en ciencias de la computación -0.034590 \n", + "career_licenciatura en ciencias de la educación -0.033549 \n", + "career_licenciatura en ciencias geológicas -0.036266 \n", + "career_licenciatura en gestión de agroalimentos -0.034246 \n", + "career_licenciatura en kinesiología y fisiatría -0.033549 \n", + "career_licenciatura en musicoterapia -0.039123 \n", + "career_licenciatura en planificación y diseño d... 
-0.038191 \n", + "career_licenciatura en producción de bioimagenes -0.036593 \n", + "career_licenciatura en psicología -0.032478 \n", + "career_licenciatura en relaciones del trabajo -0.031747 \n", + "career_licenciatura en sociología -0.036593 \n", + "career_licenciatura en terapia ocupacional -0.034931 \n", + "career_medicina 1.000000 \n", + "career_técnico para bioterios -0.034931 \n", + "\n", + " career_técnico para bioterios \n", + "gender_female 0.031490 \n", + "gender_male -0.031490 \n", + "career_actuario -0.032052 \n", + "career_agronomía -0.028328 \n", + "career_arquitectura -0.029225 \n", + "career_bioquímica -0.029518 \n", + "career_ciencias veterinarias -0.030097 \n", + "career_contador público -0.028328 \n", + "career_diseño de imagen y sonido -0.032052 \n", + "career_diseño industrial -0.033908 \n", + "career_farmacia -0.028928 \n", + "career_ingeniería electrónica -0.027092 \n", + "career_ingeniería en informática -0.031779 \n", + "career_ingeniería mecánica -0.031227 \n", + "career_licenciatura en administración -0.032052 \n", + "career_licenciatura en artes -0.032322 \n", + "career_licenciatura en ciencia política -0.032591 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030667 \n", + "career_licenciatura en ciencias ambientales -0.027716 \n", + "career_licenciatura en ciencias antropológicas -0.030383 \n", + "career_licenciatura en ciencias biológicas -0.032322 \n", + "career_licenciatura en ciencias de la computación -0.029518 \n", + "career_licenciatura en ciencias de la educación -0.028630 \n", + "career_licenciatura en ciencias geológicas -0.030948 \n", + "career_licenciatura en gestión de agroalimentos -0.029225 \n", + "career_licenciatura en kinesiología y fisiatría -0.028630 \n", + "career_licenciatura en musicoterapia -0.033387 \n", + "career_licenciatura en planificación y diseño d... 
-0.032591 \n", + "career_licenciatura en producción de bioimagenes -0.031227 \n", + "career_licenciatura en psicología -0.027716 \n", + "career_licenciatura en relaciones del trabajo -0.027092 \n", + "career_licenciatura en sociología -0.031227 \n", + "career_licenciatura en terapia ocupacional -0.029809 \n", + "career_medicina -0.034931 \n", + "career_técnico para bioterios 1.000000 \n", + "\n", + "[35 rows x 35 columns]" + ] + }, + "execution_count": 120, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "correlacion1 = dfg1.corr()\n", + "# correlacion\n", + "correlacion1" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "78b140df", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a0ef42a1", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 122, + "id": "dcfaf463", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
gender_femalegender_malecareer_actuariocareer_agronomíacareer_arquitecturacareer_bioquímicacareer_ciencias veterinariascareer_contador públicocareer_diseño de imagen y sonidocareer_diseño industrial...career_licenciatura en kinesiología y fisiatríacareer_licenciatura en musicoterapiacareer_licenciatura en planificación y diseño del paisajecareer_licenciatura en producción de bioimagenescareer_licenciatura en psicologíacareer_licenciatura en relaciones del trabajocareer_licenciatura en sociologíacareer_licenciatura en terapia ocupacionalcareer_medicinacareer_técnico para bioterios
gender_female1.000000-1.0000000.0647560.019895-0.0322130.0026160.027091-0.025293-0.0167910.007851...0.019595-0.0140090.0448690.022949-0.004099-0.0076410.0256630.001113-0.0075040.028664
gender_male-1.0000001.000000-0.064756-0.0198950.032213-0.002616-0.0270910.0252930.016791-0.007851...-0.0195950.014009-0.044869-0.0229490.0040990.007641-0.025663-0.0011130.007504-0.028664
career_actuario0.064756-0.0647561.000000-0.027736-0.024941-0.028613-0.029746-0.033192-0.031905-0.030298...-0.030842-0.033695-0.030298-0.030571-0.029184-0.030571-0.030842-0.031377-0.030023-0.028613
career_agronomía0.019895-0.019895-0.0277361.000000-0.023255-0.026680-0.027736-0.030949-0.029749-0.028251...-0.028758-0.031418-0.028251-0.028506-0.027212-0.028506-0.028758-0.029257-0.027995-0.026680
career_arquitectura-0.0322130.032213-0.024941-0.0232551.000000-0.023991-0.024941-0.027830-0.026751-0.025404...-0.025860-0.028252-0.025404-0.025633-0.024470-0.025633-0.025860-0.026308-0.025173-0.023991
career_bioquímica0.002616-0.002616-0.028613-0.026680-0.0239911.000000-0.028613-0.031928-0.030690-0.029144...-0.029667-0.032411-0.029144-0.029407-0.028073-0.029407-0.029667-0.030182-0.028880-0.027523
career_ciencias veterinarias0.027091-0.027091-0.029746-0.027736-0.024941-0.0286131.000000-0.033192-0.031905-0.030298...-0.030842-0.033695-0.030298-0.030571-0.029184-0.030571-0.030842-0.031377-0.030023-0.028613
career_contador público-0.0252930.025293-0.033192-0.030949-0.027830-0.031928-0.0331921.000000-0.035601-0.033808...-0.034415-0.037598-0.033808-0.034113-0.032565-0.034113-0.034415-0.035012-0.033501-0.031928
career_diseño de imagen y sonido-0.0167910.016791-0.031905-0.029749-0.026751-0.030690-0.031905-0.0356011.000000-0.032497...-0.033080-0.036140-0.032497-0.032790-0.031302-0.032790-0.033080-0.033655-0.032202-0.030690
career_diseño industrial0.007851-0.007851-0.030298-0.028251-0.025404-0.029144-0.030298-0.033808-0.0324971.000000...-0.031415-0.034320-0.030861-0.031139-0.029726-0.031139-0.031415-0.031960-0.030581-0.029144
career_farmacia-0.0285480.028548-0.031905-0.029749-0.026751-0.030690-0.031905-0.035601-0.034221-0.032497...-0.033080-0.036140-0.032497-0.032790-0.031302-0.032790-0.033080-0.033655-0.032202-0.030690
career_ingeniería electrónica-0.0265760.026576-0.028900-0.026947-0.024231-0.027799-0.028900-0.032248-0.030997-0.029436...-0.029965-0.032736-0.029436-0.029702-0.028354-0.029702-0.029965-0.030485-0.029169-0.027799
career_ingeniería en informática-0.0350120.035012-0.030842-0.028758-0.025860-0.029667-0.030842-0.034415-0.033080-0.031415...-0.031978-0.034936-0.031415-0.031698-0.030260-0.031698-0.031978-0.032533-0.031129-0.029667
career_ingeniería mecánica0.007851-0.007851-0.030298-0.028251-0.025404-0.029144-0.030298-0.033808-0.032497-0.030861...-0.031415-0.034320-0.030861-0.031139-0.029726-0.031139-0.031415-0.031960-0.030581-0.029144
career_licenciatura en administración0.012599-0.012599-0.031905-0.029749-0.026751-0.030690-0.031905-0.035601-0.034221-0.032497...-0.033080-0.036140-0.032497-0.032790-0.031302-0.032790-0.033080-0.033655-0.032202-0.030690
career_licenciatura en artes-0.0232730.023273-0.029184-0.027212-0.024470-0.028073-0.029184-0.032565-0.031302-0.029726...-0.030260-0.033059-0.029726-0.029994-0.028633-0.029994-0.030260-0.030785-0.029456-0.028073
career_licenciatura en ciencia política0.001113-0.001113-0.031377-0.029257-0.026308-0.030182-0.031377-0.035012-0.033655-0.031960...-0.032533-0.035543-0.031960-0.032248-0.030785-0.032248-0.032533-0.033098-0.031670-0.030182
career_licenciatura en ciencia y tecnología de alimentos0.002293-0.002293-0.029184-0.027212-0.024470-0.028073-0.029184-0.032565-0.031302-0.029726...-0.030260-0.033059-0.029726-0.029994-0.028633-0.029994-0.030260-0.030785-0.029456-0.028073
career_licenciatura en ciencias ambientales-0.0168810.016881-0.029184-0.027212-0.024470-0.028073-0.029184-0.032565-0.031302-0.029726...-0.030260-0.033059-0.029726-0.029994-0.028633-0.029994-0.030260-0.030785-0.029456-0.028073
career_licenciatura en ciencias antropológicas0.026984-0.026984-0.034437-0.032111-0.028874-0.033126-0.034437-0.038427-0.036937-0.035077...-0.035706-0.039009-0.035077-0.035393-0.033787-0.035393-0.035706-0.036326-0.034758-0.033126
career_licenciatura en ciencias biológicas0.004261-0.004261-0.031111-0.029009-0.026085-0.029926-0.031111-0.034715-0.033369-0.031688...-0.032257-0.035241-0.031688-0.031974-0.030523-0.031974-0.032257-0.032817-0.031401-0.029926
career_licenciatura en ciencias de la computación-0.0197070.019707-0.032166-0.029993-0.026970-0.030941-0.032166-0.035892-0.034500-0.032763...-0.033351-0.036436-0.032763-0.033058-0.031558-0.033058-0.033351-0.033930-0.032466-0.030941
career_licenciatura en ciencias de la educación-0.0168270.016827-0.030298-0.028251-0.025404-0.029144-0.030298-0.033808-0.032497-0.030861...-0.031415-0.034320-0.030861-0.031139-0.029726-0.031139-0.031415-0.031960-0.030581-0.029144
career_licenciatura en ciencias geológicas-0.0627020.062702-0.030571-0.028506-0.025633-0.029407-0.030571-0.034113-0.032790-0.031139...-0.031698-0.034630-0.031139-0.031419-0.029994-0.031419-0.031698-0.032248-0.030856-0.029407
career_licenciatura en gestión de agroalimentos0.016298-0.016298-0.031111-0.029009-0.026085-0.029926-0.031111-0.034715-0.033369-0.031688...-0.032257-0.035241-0.031688-0.031974-0.030523-0.031974-0.032257-0.032817-0.031401-0.029926
career_licenciatura en kinesiología y fisiatría0.019595-0.019595-0.030842-0.028758-0.025860-0.029667-0.030842-0.034415-0.033080-0.031415...1.000000-0.034936-0.031415-0.031698-0.030260-0.031698-0.031978-0.032533-0.031129-0.029667
career_licenciatura en musicoterapia-0.0140090.014009-0.033695-0.031418-0.028252-0.032411-0.033695-0.037598-0.036140-0.034320...-0.0349361.000000-0.034320-0.034630-0.033059-0.034630-0.034936-0.035543-0.034009-0.032411
career_licenciatura en planificación y diseño del paisaje0.044869-0.044869-0.030298-0.028251-0.025404-0.029144-0.030298-0.033808-0.032497-0.030861...-0.031415-0.0343201.000000-0.031139-0.029726-0.031139-0.031415-0.031960-0.030581-0.029144
career_licenciatura en producción de bioimagenes0.022949-0.022949-0.030571-0.028506-0.025633-0.029407-0.030571-0.034113-0.032790-0.031139...-0.031698-0.034630-0.0311391.000000-0.029994-0.031419-0.031698-0.032248-0.030856-0.029407
career_licenciatura en psicología-0.0040990.004099-0.029184-0.027212-0.024470-0.028073-0.029184-0.032565-0.031302-0.029726...-0.030260-0.033059-0.029726-0.0299941.000000-0.029994-0.030260-0.030785-0.029456-0.028073
career_licenciatura en relaciones del trabajo-0.0076410.007641-0.030571-0.028506-0.025633-0.029407-0.030571-0.034113-0.032790-0.031139...-0.031698-0.034630-0.031139-0.031419-0.0299941.000000-0.031698-0.032248-0.030856-0.029407
career_licenciatura en sociología0.025663-0.025663-0.030842-0.028758-0.025860-0.029667-0.030842-0.034415-0.033080-0.031415...-0.031978-0.034936-0.031415-0.031698-0.030260-0.0316981.000000-0.032533-0.031129-0.029667
career_licenciatura en terapia ocupacional0.001113-0.001113-0.031377-0.029257-0.026308-0.030182-0.031377-0.035012-0.033655-0.031960...-0.032533-0.035543-0.031960-0.032248-0.030785-0.032248-0.0325331.000000-0.031670-0.030182
career_medicina-0.0075040.007504-0.030023-0.027995-0.025173-0.028880-0.030023-0.033501-0.032202-0.030581...-0.031129-0.034009-0.030581-0.030856-0.029456-0.030856-0.031129-0.0316701.000000-0.028880
career_técnico para bioterios0.028664-0.028664-0.028613-0.026680-0.023991-0.027523-0.028613-0.031928-0.030690-0.029144...-0.029667-0.032411-0.029144-0.029407-0.028073-0.029407-0.029667-0.030182-0.0288801.000000
\n", + "

35 rows × 35 columns

\n", + "
" + ], + "text/plain": [ + " gender_female \\\n", + "gender_female 1.000000 \n", + "gender_male -1.000000 \n", + "career_actuario 0.064756 \n", + "career_agronomía 0.019895 \n", + "career_arquitectura -0.032213 \n", + "career_bioquímica 0.002616 \n", + "career_ciencias veterinarias 0.027091 \n", + "career_contador público -0.025293 \n", + "career_diseño de imagen y sonido -0.016791 \n", + "career_diseño industrial 0.007851 \n", + "career_farmacia -0.028548 \n", + "career_ingeniería electrónica -0.026576 \n", + "career_ingeniería en informática -0.035012 \n", + "career_ingeniería mecánica 0.007851 \n", + "career_licenciatura en administración 0.012599 \n", + "career_licenciatura en artes -0.023273 \n", + "career_licenciatura en ciencia política 0.001113 \n", + "career_licenciatura en ciencia y tecnología de ... 0.002293 \n", + "career_licenciatura en ciencias ambientales -0.016881 \n", + "career_licenciatura en ciencias antropológicas 0.026984 \n", + "career_licenciatura en ciencias biológicas 0.004261 \n", + "career_licenciatura en ciencias de la computación -0.019707 \n", + "career_licenciatura en ciencias de la educación -0.016827 \n", + "career_licenciatura en ciencias geológicas -0.062702 \n", + "career_licenciatura en gestión de agroalimentos 0.016298 \n", + "career_licenciatura en kinesiología y fisiatría 0.019595 \n", + "career_licenciatura en musicoterapia -0.014009 \n", + "career_licenciatura en planificación y diseño d... 
0.044869 \n", + "career_licenciatura en producción de bioimagenes 0.022949 \n", + "career_licenciatura en psicología -0.004099 \n", + "career_licenciatura en relaciones del trabajo -0.007641 \n", + "career_licenciatura en sociología 0.025663 \n", + "career_licenciatura en terapia ocupacional 0.001113 \n", + "career_medicina -0.007504 \n", + "career_técnico para bioterios 0.028664 \n", + "\n", + " gender_male \\\n", + "gender_female -1.000000 \n", + "gender_male 1.000000 \n", + "career_actuario -0.064756 \n", + "career_agronomía -0.019895 \n", + "career_arquitectura 0.032213 \n", + "career_bioquímica -0.002616 \n", + "career_ciencias veterinarias -0.027091 \n", + "career_contador público 0.025293 \n", + "career_diseño de imagen y sonido 0.016791 \n", + "career_diseño industrial -0.007851 \n", + "career_farmacia 0.028548 \n", + "career_ingeniería electrónica 0.026576 \n", + "career_ingeniería en informática 0.035012 \n", + "career_ingeniería mecánica -0.007851 \n", + "career_licenciatura en administración -0.012599 \n", + "career_licenciatura en artes 0.023273 \n", + "career_licenciatura en ciencia política -0.001113 \n", + "career_licenciatura en ciencia y tecnología de ... -0.002293 \n", + "career_licenciatura en ciencias ambientales 0.016881 \n", + "career_licenciatura en ciencias antropológicas -0.026984 \n", + "career_licenciatura en ciencias biológicas -0.004261 \n", + "career_licenciatura en ciencias de la computación 0.019707 \n", + "career_licenciatura en ciencias de la educación 0.016827 \n", + "career_licenciatura en ciencias geológicas 0.062702 \n", + "career_licenciatura en gestión de agroalimentos -0.016298 \n", + "career_licenciatura en kinesiología y fisiatría -0.019595 \n", + "career_licenciatura en musicoterapia 0.014009 \n", + "career_licenciatura en planificación y diseño d... 
-0.044869 \n", + "career_licenciatura en producción de bioimagenes -0.022949 \n", + "career_licenciatura en psicología 0.004099 \n", + "career_licenciatura en relaciones del trabajo 0.007641 \n", + "career_licenciatura en sociología -0.025663 \n", + "career_licenciatura en terapia ocupacional -0.001113 \n", + "career_medicina 0.007504 \n", + "career_técnico para bioterios -0.028664 \n", + "\n", + " career_actuario \\\n", + "gender_female 0.064756 \n", + "gender_male -0.064756 \n", + "career_actuario 1.000000 \n", + "career_agronomía -0.027736 \n", + "career_arquitectura -0.024941 \n", + "career_bioquímica -0.028613 \n", + "career_ciencias veterinarias -0.029746 \n", + "career_contador público -0.033192 \n", + "career_diseño de imagen y sonido -0.031905 \n", + "career_diseño industrial -0.030298 \n", + "career_farmacia -0.031905 \n", + "career_ingeniería electrónica -0.028900 \n", + "career_ingeniería en informática -0.030842 \n", + "career_ingeniería mecánica -0.030298 \n", + "career_licenciatura en administración -0.031905 \n", + "career_licenciatura en artes -0.029184 \n", + "career_licenciatura en ciencia política -0.031377 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029184 \n", + "career_licenciatura en ciencias ambientales -0.029184 \n", + "career_licenciatura en ciencias antropológicas -0.034437 \n", + "career_licenciatura en ciencias biológicas -0.031111 \n", + "career_licenciatura en ciencias de la computación -0.032166 \n", + "career_licenciatura en ciencias de la educación -0.030298 \n", + "career_licenciatura en ciencias geológicas -0.030571 \n", + "career_licenciatura en gestión de agroalimentos -0.031111 \n", + "career_licenciatura en kinesiología y fisiatría -0.030842 \n", + "career_licenciatura en musicoterapia -0.033695 \n", + "career_licenciatura en planificación y diseño d... 
-0.030298 \n", + "career_licenciatura en producción de bioimagenes -0.030571 \n", + "career_licenciatura en psicología -0.029184 \n", + "career_licenciatura en relaciones del trabajo -0.030571 \n", + "career_licenciatura en sociología -0.030842 \n", + "career_licenciatura en terapia ocupacional -0.031377 \n", + "career_medicina -0.030023 \n", + "career_técnico para bioterios -0.028613 \n", + "\n", + " career_agronomía \\\n", + "gender_female 0.019895 \n", + "gender_male -0.019895 \n", + "career_actuario -0.027736 \n", + "career_agronomía 1.000000 \n", + "career_arquitectura -0.023255 \n", + "career_bioquímica -0.026680 \n", + "career_ciencias veterinarias -0.027736 \n", + "career_contador público -0.030949 \n", + "career_diseño de imagen y sonido -0.029749 \n", + "career_diseño industrial -0.028251 \n", + "career_farmacia -0.029749 \n", + "career_ingeniería electrónica -0.026947 \n", + "career_ingeniería en informática -0.028758 \n", + "career_ingeniería mecánica -0.028251 \n", + "career_licenciatura en administración -0.029749 \n", + "career_licenciatura en artes -0.027212 \n", + "career_licenciatura en ciencia política -0.029257 \n", + "career_licenciatura en ciencia y tecnología de ... -0.027212 \n", + "career_licenciatura en ciencias ambientales -0.027212 \n", + "career_licenciatura en ciencias antropológicas -0.032111 \n", + "career_licenciatura en ciencias biológicas -0.029009 \n", + "career_licenciatura en ciencias de la computación -0.029993 \n", + "career_licenciatura en ciencias de la educación -0.028251 \n", + "career_licenciatura en ciencias geológicas -0.028506 \n", + "career_licenciatura en gestión de agroalimentos -0.029009 \n", + "career_licenciatura en kinesiología y fisiatría -0.028758 \n", + "career_licenciatura en musicoterapia -0.031418 \n", + "career_licenciatura en planificación y diseño d... 
-0.028251 \n", + "career_licenciatura en producción de bioimagenes -0.028506 \n", + "career_licenciatura en psicología -0.027212 \n", + "career_licenciatura en relaciones del trabajo -0.028506 \n", + "career_licenciatura en sociología -0.028758 \n", + "career_licenciatura en terapia ocupacional -0.029257 \n", + "career_medicina -0.027995 \n", + "career_técnico para bioterios -0.026680 \n", + "\n", + " career_arquitectura \\\n", + "gender_female -0.032213 \n", + "gender_male 0.032213 \n", + "career_actuario -0.024941 \n", + "career_agronomía -0.023255 \n", + "career_arquitectura 1.000000 \n", + "career_bioquímica -0.023991 \n", + "career_ciencias veterinarias -0.024941 \n", + "career_contador público -0.027830 \n", + "career_diseño de imagen y sonido -0.026751 \n", + "career_diseño industrial -0.025404 \n", + "career_farmacia -0.026751 \n", + "career_ingeniería electrónica -0.024231 \n", + "career_ingeniería en informática -0.025860 \n", + "career_ingeniería mecánica -0.025404 \n", + "career_licenciatura en administración -0.026751 \n", + "career_licenciatura en artes -0.024470 \n", + "career_licenciatura en ciencia política -0.026308 \n", + "career_licenciatura en ciencia y tecnología de ... -0.024470 \n", + "career_licenciatura en ciencias ambientales -0.024470 \n", + "career_licenciatura en ciencias antropológicas -0.028874 \n", + "career_licenciatura en ciencias biológicas -0.026085 \n", + "career_licenciatura en ciencias de la computación -0.026970 \n", + "career_licenciatura en ciencias de la educación -0.025404 \n", + "career_licenciatura en ciencias geológicas -0.025633 \n", + "career_licenciatura en gestión de agroalimentos -0.026085 \n", + "career_licenciatura en kinesiología y fisiatría -0.025860 \n", + "career_licenciatura en musicoterapia -0.028252 \n", + "career_licenciatura en planificación y diseño d... 
-0.025404 \n", + "career_licenciatura en producción de bioimagenes -0.025633 \n", + "career_licenciatura en psicología -0.024470 \n", + "career_licenciatura en relaciones del trabajo -0.025633 \n", + "career_licenciatura en sociología -0.025860 \n", + "career_licenciatura en terapia ocupacional -0.026308 \n", + "career_medicina -0.025173 \n", + "career_técnico para bioterios -0.023991 \n", + "\n", + " career_bioquímica \\\n", + "gender_female 0.002616 \n", + "gender_male -0.002616 \n", + "career_actuario -0.028613 \n", + "career_agronomía -0.026680 \n", + "career_arquitectura -0.023991 \n", + "career_bioquímica 1.000000 \n", + "career_ciencias veterinarias -0.028613 \n", + "career_contador público -0.031928 \n", + "career_diseño de imagen y sonido -0.030690 \n", + "career_diseño industrial -0.029144 \n", + "career_farmacia -0.030690 \n", + "career_ingeniería electrónica -0.027799 \n", + "career_ingeniería en informática -0.029667 \n", + "career_ingeniería mecánica -0.029144 \n", + "career_licenciatura en administración -0.030690 \n", + "career_licenciatura en artes -0.028073 \n", + "career_licenciatura en ciencia política -0.030182 \n", + "career_licenciatura en ciencia y tecnología de ... -0.028073 \n", + "career_licenciatura en ciencias ambientales -0.028073 \n", + "career_licenciatura en ciencias antropológicas -0.033126 \n", + "career_licenciatura en ciencias biológicas -0.029926 \n", + "career_licenciatura en ciencias de la computación -0.030941 \n", + "career_licenciatura en ciencias de la educación -0.029144 \n", + "career_licenciatura en ciencias geológicas -0.029407 \n", + "career_licenciatura en gestión de agroalimentos -0.029926 \n", + "career_licenciatura en kinesiología y fisiatría -0.029667 \n", + "career_licenciatura en musicoterapia -0.032411 \n", + "career_licenciatura en planificación y diseño d... 
-0.029144 \n", + "career_licenciatura en producción de bioimagenes -0.029407 \n", + "career_licenciatura en psicología -0.028073 \n", + "career_licenciatura en relaciones del trabajo -0.029407 \n", + "career_licenciatura en sociología -0.029667 \n", + "career_licenciatura en terapia ocupacional -0.030182 \n", + "career_medicina -0.028880 \n", + "career_técnico para bioterios -0.027523 \n", + "\n", + " career_ciencias veterinarias \\\n", + "gender_female 0.027091 \n", + "gender_male -0.027091 \n", + "career_actuario -0.029746 \n", + "career_agronomía -0.027736 \n", + "career_arquitectura -0.024941 \n", + "career_bioquímica -0.028613 \n", + "career_ciencias veterinarias 1.000000 \n", + "career_contador público -0.033192 \n", + "career_diseño de imagen y sonido -0.031905 \n", + "career_diseño industrial -0.030298 \n", + "career_farmacia -0.031905 \n", + "career_ingeniería electrónica -0.028900 \n", + "career_ingeniería en informática -0.030842 \n", + "career_ingeniería mecánica -0.030298 \n", + "career_licenciatura en administración -0.031905 \n", + "career_licenciatura en artes -0.029184 \n", + "career_licenciatura en ciencia política -0.031377 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029184 \n", + "career_licenciatura en ciencias ambientales -0.029184 \n", + "career_licenciatura en ciencias antropológicas -0.034437 \n", + "career_licenciatura en ciencias biológicas -0.031111 \n", + "career_licenciatura en ciencias de la computación -0.032166 \n", + "career_licenciatura en ciencias de la educación -0.030298 \n", + "career_licenciatura en ciencias geológicas -0.030571 \n", + "career_licenciatura en gestión de agroalimentos -0.031111 \n", + "career_licenciatura en kinesiología y fisiatría -0.030842 \n", + "career_licenciatura en musicoterapia -0.033695 \n", + "career_licenciatura en planificación y diseño d... 
-0.030298 \n", + "career_licenciatura en producción de bioimagenes -0.030571 \n", + "career_licenciatura en psicología -0.029184 \n", + "career_licenciatura en relaciones del trabajo -0.030571 \n", + "career_licenciatura en sociología -0.030842 \n", + "career_licenciatura en terapia ocupacional -0.031377 \n", + "career_medicina -0.030023 \n", + "career_técnico para bioterios -0.028613 \n", + "\n", + " career_contador público \\\n", + "gender_female -0.025293 \n", + "gender_male 0.025293 \n", + "career_actuario -0.033192 \n", + "career_agronomía -0.030949 \n", + "career_arquitectura -0.027830 \n", + "career_bioquímica -0.031928 \n", + "career_ciencias veterinarias -0.033192 \n", + "career_contador público 1.000000 \n", + "career_diseño de imagen y sonido -0.035601 \n", + "career_diseño industrial -0.033808 \n", + "career_farmacia -0.035601 \n", + "career_ingeniería electrónica -0.032248 \n", + "career_ingeniería en informática -0.034415 \n", + "career_ingeniería mecánica -0.033808 \n", + "career_licenciatura en administración -0.035601 \n", + "career_licenciatura en artes -0.032565 \n", + "career_licenciatura en ciencia política -0.035012 \n", + "career_licenciatura en ciencia y tecnología de ... -0.032565 \n", + "career_licenciatura en ciencias ambientales -0.032565 \n", + "career_licenciatura en ciencias antropológicas -0.038427 \n", + "career_licenciatura en ciencias biológicas -0.034715 \n", + "career_licenciatura en ciencias de la computación -0.035892 \n", + "career_licenciatura en ciencias de la educación -0.033808 \n", + "career_licenciatura en ciencias geológicas -0.034113 \n", + "career_licenciatura en gestión de agroalimentos -0.034715 \n", + "career_licenciatura en kinesiología y fisiatría -0.034415 \n", + "career_licenciatura en musicoterapia -0.037598 \n", + "career_licenciatura en planificación y diseño d... 
-0.033808 \n", + "career_licenciatura en producción de bioimagenes -0.034113 \n", + "career_licenciatura en psicología -0.032565 \n", + "career_licenciatura en relaciones del trabajo -0.034113 \n", + "career_licenciatura en sociología -0.034415 \n", + "career_licenciatura en terapia ocupacional -0.035012 \n", + "career_medicina -0.033501 \n", + "career_técnico para bioterios -0.031928 \n", + "\n", + " career_diseño de imagen y sonido \\\n", + "gender_female -0.016791 \n", + "gender_male 0.016791 \n", + "career_actuario -0.031905 \n", + "career_agronomía -0.029749 \n", + "career_arquitectura -0.026751 \n", + "career_bioquímica -0.030690 \n", + "career_ciencias veterinarias -0.031905 \n", + "career_contador público -0.035601 \n", + "career_diseño de imagen y sonido 1.000000 \n", + "career_diseño industrial -0.032497 \n", + "career_farmacia -0.034221 \n", + "career_ingeniería electrónica -0.030997 \n", + "career_ingeniería en informática -0.033080 \n", + "career_ingeniería mecánica -0.032497 \n", + "career_licenciatura en administración -0.034221 \n", + "career_licenciatura en artes -0.031302 \n", + "career_licenciatura en ciencia política -0.033655 \n", + "career_licenciatura en ciencia y tecnología de ... -0.031302 \n", + "career_licenciatura en ciencias ambientales -0.031302 \n", + "career_licenciatura en ciencias antropológicas -0.036937 \n", + "career_licenciatura en ciencias biológicas -0.033369 \n", + "career_licenciatura en ciencias de la computación -0.034500 \n", + "career_licenciatura en ciencias de la educación -0.032497 \n", + "career_licenciatura en ciencias geológicas -0.032790 \n", + "career_licenciatura en gestión de agroalimentos -0.033369 \n", + "career_licenciatura en kinesiología y fisiatría -0.033080 \n", + "career_licenciatura en musicoterapia -0.036140 \n", + "career_licenciatura en planificación y diseño d... 
-0.032497 \n", + "career_licenciatura en producción de bioimagenes -0.032790 \n", + "career_licenciatura en psicología -0.031302 \n", + "career_licenciatura en relaciones del trabajo -0.032790 \n", + "career_licenciatura en sociología -0.033080 \n", + "career_licenciatura en terapia ocupacional -0.033655 \n", + "career_medicina -0.032202 \n", + "career_técnico para bioterios -0.030690 \n", + "\n", + " career_diseño industrial \\\n", + "gender_female 0.007851 \n", + "gender_male -0.007851 \n", + "career_actuario -0.030298 \n", + "career_agronomía -0.028251 \n", + "career_arquitectura -0.025404 \n", + "career_bioquímica -0.029144 \n", + "career_ciencias veterinarias -0.030298 \n", + "career_contador público -0.033808 \n", + "career_diseño de imagen y sonido -0.032497 \n", + "career_diseño industrial 1.000000 \n", + "career_farmacia -0.032497 \n", + "career_ingeniería electrónica -0.029436 \n", + "career_ingeniería en informática -0.031415 \n", + "career_ingeniería mecánica -0.030861 \n", + "career_licenciatura en administración -0.032497 \n", + "career_licenciatura en artes -0.029726 \n", + "career_licenciatura en ciencia política -0.031960 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029726 \n", + "career_licenciatura en ciencias ambientales -0.029726 \n", + "career_licenciatura en ciencias antropológicas -0.035077 \n", + "career_licenciatura en ciencias biológicas -0.031688 \n", + "career_licenciatura en ciencias de la computación -0.032763 \n", + "career_licenciatura en ciencias de la educación -0.030861 \n", + "career_licenciatura en ciencias geológicas -0.031139 \n", + "career_licenciatura en gestión de agroalimentos -0.031688 \n", + "career_licenciatura en kinesiología y fisiatría -0.031415 \n", + "career_licenciatura en musicoterapia -0.034320 \n", + "career_licenciatura en planificación y diseño d... 
-0.030861 \n", + "career_licenciatura en producción de bioimagenes -0.031139 \n", + "career_licenciatura en psicología -0.029726 \n", + "career_licenciatura en relaciones del trabajo -0.031139 \n", + "career_licenciatura en sociología -0.031415 \n", + "career_licenciatura en terapia ocupacional -0.031960 \n", + "career_medicina -0.030581 \n", + "career_técnico para bioterios -0.029144 \n", + "\n", + " ... \\\n", + "gender_female ... \n", + "gender_male ... \n", + "career_actuario ... \n", + "career_agronomía ... \n", + "career_arquitectura ... \n", + "career_bioquímica ... \n", + "career_ciencias veterinarias ... \n", + "career_contador público ... \n", + "career_diseño de imagen y sonido ... \n", + "career_diseño industrial ... \n", + "career_farmacia ... \n", + "career_ingeniería electrónica ... \n", + "career_ingeniería en informática ... \n", + "career_ingeniería mecánica ... \n", + "career_licenciatura en administración ... \n", + "career_licenciatura en artes ... \n", + "career_licenciatura en ciencia política ... \n", + "career_licenciatura en ciencia y tecnología de ... ... \n", + "career_licenciatura en ciencias ambientales ... \n", + "career_licenciatura en ciencias antropológicas ... \n", + "career_licenciatura en ciencias biológicas ... \n", + "career_licenciatura en ciencias de la computación ... \n", + "career_licenciatura en ciencias de la educación ... \n", + "career_licenciatura en ciencias geológicas ... \n", + "career_licenciatura en gestión de agroalimentos ... \n", + "career_licenciatura en kinesiología y fisiatría ... \n", + "career_licenciatura en musicoterapia ... \n", + "career_licenciatura en planificación y diseño d... ... \n", + "career_licenciatura en producción de bioimagenes ... \n", + "career_licenciatura en psicología ... \n", + "career_licenciatura en relaciones del trabajo ... \n", + "career_licenciatura en sociología ... \n", + "career_licenciatura en terapia ocupacional ... \n", + "career_medicina ... 
\n", + "career_técnico para bioterios ... \n", + "\n", + " career_licenciatura en kinesiología y fisiatría \\\n", + "gender_female 0.019595 \n", + "gender_male -0.019595 \n", + "career_actuario -0.030842 \n", + "career_agronomía -0.028758 \n", + "career_arquitectura -0.025860 \n", + "career_bioquímica -0.029667 \n", + "career_ciencias veterinarias -0.030842 \n", + "career_contador público -0.034415 \n", + "career_diseño de imagen y sonido -0.033080 \n", + "career_diseño industrial -0.031415 \n", + "career_farmacia -0.033080 \n", + "career_ingeniería electrónica -0.029965 \n", + "career_ingeniería en informática -0.031978 \n", + "career_ingeniería mecánica -0.031415 \n", + "career_licenciatura en administración -0.033080 \n", + "career_licenciatura en artes -0.030260 \n", + "career_licenciatura en ciencia política -0.032533 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030260 \n", + "career_licenciatura en ciencias ambientales -0.030260 \n", + "career_licenciatura en ciencias antropológicas -0.035706 \n", + "career_licenciatura en ciencias biológicas -0.032257 \n", + "career_licenciatura en ciencias de la computación -0.033351 \n", + "career_licenciatura en ciencias de la educación -0.031415 \n", + "career_licenciatura en ciencias geológicas -0.031698 \n", + "career_licenciatura en gestión de agroalimentos -0.032257 \n", + "career_licenciatura en kinesiología y fisiatría 1.000000 \n", + "career_licenciatura en musicoterapia -0.034936 \n", + "career_licenciatura en planificación y diseño d... 
-0.031415 \n", + "career_licenciatura en producción de bioimagenes -0.031698 \n", + "career_licenciatura en psicología -0.030260 \n", + "career_licenciatura en relaciones del trabajo -0.031698 \n", + "career_licenciatura en sociología -0.031978 \n", + "career_licenciatura en terapia ocupacional -0.032533 \n", + "career_medicina -0.031129 \n", + "career_técnico para bioterios -0.029667 \n", + "\n", + " career_licenciatura en musicoterapia \\\n", + "gender_female -0.014009 \n", + "gender_male 0.014009 \n", + "career_actuario -0.033695 \n", + "career_agronomía -0.031418 \n", + "career_arquitectura -0.028252 \n", + "career_bioquímica -0.032411 \n", + "career_ciencias veterinarias -0.033695 \n", + "career_contador público -0.037598 \n", + "career_diseño de imagen y sonido -0.036140 \n", + "career_diseño industrial -0.034320 \n", + "career_farmacia -0.036140 \n", + "career_ingeniería electrónica -0.032736 \n", + "career_ingeniería en informática -0.034936 \n", + "career_ingeniería mecánica -0.034320 \n", + "career_licenciatura en administración -0.036140 \n", + "career_licenciatura en artes -0.033059 \n", + "career_licenciatura en ciencia política -0.035543 \n", + "career_licenciatura en ciencia y tecnología de ... -0.033059 \n", + "career_licenciatura en ciencias ambientales -0.033059 \n", + "career_licenciatura en ciencias antropológicas -0.039009 \n", + "career_licenciatura en ciencias biológicas -0.035241 \n", + "career_licenciatura en ciencias de la computación -0.036436 \n", + "career_licenciatura en ciencias de la educación -0.034320 \n", + "career_licenciatura en ciencias geológicas -0.034630 \n", + "career_licenciatura en gestión de agroalimentos -0.035241 \n", + "career_licenciatura en kinesiología y fisiatría -0.034936 \n", + "career_licenciatura en musicoterapia 1.000000 \n", + "career_licenciatura en planificación y diseño d... 
-0.034320 \n", + "career_licenciatura en producción de bioimagenes -0.034630 \n", + "career_licenciatura en psicología -0.033059 \n", + "career_licenciatura en relaciones del trabajo -0.034630 \n", + "career_licenciatura en sociología -0.034936 \n", + "career_licenciatura en terapia ocupacional -0.035543 \n", + "career_medicina -0.034009 \n", + "career_técnico para bioterios -0.032411 \n", + "\n", + " career_licenciatura en planificación y diseño del paisaje \\\n", + "gender_female 0.044869 \n", + "gender_male -0.044869 \n", + "career_actuario -0.030298 \n", + "career_agronomía -0.028251 \n", + "career_arquitectura -0.025404 \n", + "career_bioquímica -0.029144 \n", + "career_ciencias veterinarias -0.030298 \n", + "career_contador público -0.033808 \n", + "career_diseño de imagen y sonido -0.032497 \n", + "career_diseño industrial -0.030861 \n", + "career_farmacia -0.032497 \n", + "career_ingeniería electrónica -0.029436 \n", + "career_ingeniería en informática -0.031415 \n", + "career_ingeniería mecánica -0.030861 \n", + "career_licenciatura en administración -0.032497 \n", + "career_licenciatura en artes -0.029726 \n", + "career_licenciatura en ciencia política -0.031960 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029726 \n", + "career_licenciatura en ciencias ambientales -0.029726 \n", + "career_licenciatura en ciencias antropológicas -0.035077 \n", + "career_licenciatura en ciencias biológicas -0.031688 \n", + "career_licenciatura en ciencias de la computación -0.032763 \n", + "career_licenciatura en ciencias de la educación -0.030861 \n", + "career_licenciatura en ciencias geológicas -0.031139 \n", + "career_licenciatura en gestión de agroalimentos -0.031688 \n", + "career_licenciatura en kinesiología y fisiatría -0.031415 \n", + "career_licenciatura en musicoterapia -0.034320 \n", + "career_licenciatura en planificación y diseño d... 
1.000000 \n", + "career_licenciatura en producción de bioimagenes -0.031139 \n", + "career_licenciatura en psicología -0.029726 \n", + "career_licenciatura en relaciones del trabajo -0.031139 \n", + "career_licenciatura en sociología -0.031415 \n", + "career_licenciatura en terapia ocupacional -0.031960 \n", + "career_medicina -0.030581 \n", + "career_técnico para bioterios -0.029144 \n", + "\n", + " career_licenciatura en producción de bioimagenes \\\n", + "gender_female 0.022949 \n", + "gender_male -0.022949 \n", + "career_actuario -0.030571 \n", + "career_agronomía -0.028506 \n", + "career_arquitectura -0.025633 \n", + "career_bioquímica -0.029407 \n", + "career_ciencias veterinarias -0.030571 \n", + "career_contador público -0.034113 \n", + "career_diseño de imagen y sonido -0.032790 \n", + "career_diseño industrial -0.031139 \n", + "career_farmacia -0.032790 \n", + "career_ingeniería electrónica -0.029702 \n", + "career_ingeniería en informática -0.031698 \n", + "career_ingeniería mecánica -0.031139 \n", + "career_licenciatura en administración -0.032790 \n", + "career_licenciatura en artes -0.029994 \n", + "career_licenciatura en ciencia política -0.032248 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029994 \n", + "career_licenciatura en ciencias ambientales -0.029994 \n", + "career_licenciatura en ciencias antropológicas -0.035393 \n", + "career_licenciatura en ciencias biológicas -0.031974 \n", + "career_licenciatura en ciencias de la computación -0.033058 \n", + "career_licenciatura en ciencias de la educación -0.031139 \n", + "career_licenciatura en ciencias geológicas -0.031419 \n", + "career_licenciatura en gestión de agroalimentos -0.031974 \n", + "career_licenciatura en kinesiología y fisiatría -0.031698 \n", + "career_licenciatura en musicoterapia -0.034630 \n", + "career_licenciatura en planificación y diseño d... 
-0.031139 \n", + "career_licenciatura en producción de bioimagenes 1.000000 \n", + "career_licenciatura en psicología -0.029994 \n", + "career_licenciatura en relaciones del trabajo -0.031419 \n", + "career_licenciatura en sociología -0.031698 \n", + "career_licenciatura en terapia ocupacional -0.032248 \n", + "career_medicina -0.030856 \n", + "career_técnico para bioterios -0.029407 \n", + "\n", + " career_licenciatura en psicología \\\n", + "gender_female -0.004099 \n", + "gender_male 0.004099 \n", + "career_actuario -0.029184 \n", + "career_agronomía -0.027212 \n", + "career_arquitectura -0.024470 \n", + "career_bioquímica -0.028073 \n", + "career_ciencias veterinarias -0.029184 \n", + "career_contador público -0.032565 \n", + "career_diseño de imagen y sonido -0.031302 \n", + "career_diseño industrial -0.029726 \n", + "career_farmacia -0.031302 \n", + "career_ingeniería electrónica -0.028354 \n", + "career_ingeniería en informática -0.030260 \n", + "career_ingeniería mecánica -0.029726 \n", + "career_licenciatura en administración -0.031302 \n", + "career_licenciatura en artes -0.028633 \n", + "career_licenciatura en ciencia política -0.030785 \n", + "career_licenciatura en ciencia y tecnología de ... -0.028633 \n", + "career_licenciatura en ciencias ambientales -0.028633 \n", + "career_licenciatura en ciencias antropológicas -0.033787 \n", + "career_licenciatura en ciencias biológicas -0.030523 \n", + "career_licenciatura en ciencias de la computación -0.031558 \n", + "career_licenciatura en ciencias de la educación -0.029726 \n", + "career_licenciatura en ciencias geológicas -0.029994 \n", + "career_licenciatura en gestión de agroalimentos -0.030523 \n", + "career_licenciatura en kinesiología y fisiatría -0.030260 \n", + "career_licenciatura en musicoterapia -0.033059 \n", + "career_licenciatura en planificación y diseño d... 
-0.029726 \n", + "career_licenciatura en producción de bioimagenes -0.029994 \n", + "career_licenciatura en psicología 1.000000 \n", + "career_licenciatura en relaciones del trabajo -0.029994 \n", + "career_licenciatura en sociología -0.030260 \n", + "career_licenciatura en terapia ocupacional -0.030785 \n", + "career_medicina -0.029456 \n", + "career_técnico para bioterios -0.028073 \n", + "\n", + " career_licenciatura en relaciones del trabajo \\\n", + "gender_female -0.007641 \n", + "gender_male 0.007641 \n", + "career_actuario -0.030571 \n", + "career_agronomía -0.028506 \n", + "career_arquitectura -0.025633 \n", + "career_bioquímica -0.029407 \n", + "career_ciencias veterinarias -0.030571 \n", + "career_contador público -0.034113 \n", + "career_diseño de imagen y sonido -0.032790 \n", + "career_diseño industrial -0.031139 \n", + "career_farmacia -0.032790 \n", + "career_ingeniería electrónica -0.029702 \n", + "career_ingeniería en informática -0.031698 \n", + "career_ingeniería mecánica -0.031139 \n", + "career_licenciatura en administración -0.032790 \n", + "career_licenciatura en artes -0.029994 \n", + "career_licenciatura en ciencia política -0.032248 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029994 \n", + "career_licenciatura en ciencias ambientales -0.029994 \n", + "career_licenciatura en ciencias antropológicas -0.035393 \n", + "career_licenciatura en ciencias biológicas -0.031974 \n", + "career_licenciatura en ciencias de la computación -0.033058 \n", + "career_licenciatura en ciencias de la educación -0.031139 \n", + "career_licenciatura en ciencias geológicas -0.031419 \n", + "career_licenciatura en gestión de agroalimentos -0.031974 \n", + "career_licenciatura en kinesiología y fisiatría -0.031698 \n", + "career_licenciatura en musicoterapia -0.034630 \n", + "career_licenciatura en planificación y diseño d... 
-0.031139 \n", + "career_licenciatura en producción de bioimagenes -0.031419 \n", + "career_licenciatura en psicología -0.029994 \n", + "career_licenciatura en relaciones del trabajo 1.000000 \n", + "career_licenciatura en sociología -0.031698 \n", + "career_licenciatura en terapia ocupacional -0.032248 \n", + "career_medicina -0.030856 \n", + "career_técnico para bioterios -0.029407 \n", + "\n", + " career_licenciatura en sociología \\\n", + "gender_female 0.025663 \n", + "gender_male -0.025663 \n", + "career_actuario -0.030842 \n", + "career_agronomía -0.028758 \n", + "career_arquitectura -0.025860 \n", + "career_bioquímica -0.029667 \n", + "career_ciencias veterinarias -0.030842 \n", + "career_contador público -0.034415 \n", + "career_diseño de imagen y sonido -0.033080 \n", + "career_diseño industrial -0.031415 \n", + "career_farmacia -0.033080 \n", + "career_ingeniería electrónica -0.029965 \n", + "career_ingeniería en informática -0.031978 \n", + "career_ingeniería mecánica -0.031415 \n", + "career_licenciatura en administración -0.033080 \n", + "career_licenciatura en artes -0.030260 \n", + "career_licenciatura en ciencia política -0.032533 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030260 \n", + "career_licenciatura en ciencias ambientales -0.030260 \n", + "career_licenciatura en ciencias antropológicas -0.035706 \n", + "career_licenciatura en ciencias biológicas -0.032257 \n", + "career_licenciatura en ciencias de la computación -0.033351 \n", + "career_licenciatura en ciencias de la educación -0.031415 \n", + "career_licenciatura en ciencias geológicas -0.031698 \n", + "career_licenciatura en gestión de agroalimentos -0.032257 \n", + "career_licenciatura en kinesiología y fisiatría -0.031978 \n", + "career_licenciatura en musicoterapia -0.034936 \n", + "career_licenciatura en planificación y diseño d... 
-0.031415 \n", + "career_licenciatura en producción de bioimagenes -0.031698 \n", + "career_licenciatura en psicología -0.030260 \n", + "career_licenciatura en relaciones del trabajo -0.031698 \n", + "career_licenciatura en sociología 1.000000 \n", + "career_licenciatura en terapia ocupacional -0.032533 \n", + "career_medicina -0.031129 \n", + "career_técnico para bioterios -0.029667 \n", + "\n", + " career_licenciatura en terapia ocupacional \\\n", + "gender_female 0.001113 \n", + "gender_male -0.001113 \n", + "career_actuario -0.031377 \n", + "career_agronomía -0.029257 \n", + "career_arquitectura -0.026308 \n", + "career_bioquímica -0.030182 \n", + "career_ciencias veterinarias -0.031377 \n", + "career_contador público -0.035012 \n", + "career_diseño de imagen y sonido -0.033655 \n", + "career_diseño industrial -0.031960 \n", + "career_farmacia -0.033655 \n", + "career_ingeniería electrónica -0.030485 \n", + "career_ingeniería en informática -0.032533 \n", + "career_ingeniería mecánica -0.031960 \n", + "career_licenciatura en administración -0.033655 \n", + "career_licenciatura en artes -0.030785 \n", + "career_licenciatura en ciencia política -0.033098 \n", + "career_licenciatura en ciencia y tecnología de ... -0.030785 \n", + "career_licenciatura en ciencias ambientales -0.030785 \n", + "career_licenciatura en ciencias antropológicas -0.036326 \n", + "career_licenciatura en ciencias biológicas -0.032817 \n", + "career_licenciatura en ciencias de la computación -0.033930 \n", + "career_licenciatura en ciencias de la educación -0.031960 \n", + "career_licenciatura en ciencias geológicas -0.032248 \n", + "career_licenciatura en gestión de agroalimentos -0.032817 \n", + "career_licenciatura en kinesiología y fisiatría -0.032533 \n", + "career_licenciatura en musicoterapia -0.035543 \n", + "career_licenciatura en planificación y diseño d... 
-0.031960 \n", + "career_licenciatura en producción de bioimagenes -0.032248 \n", + "career_licenciatura en psicología -0.030785 \n", + "career_licenciatura en relaciones del trabajo -0.032248 \n", + "career_licenciatura en sociología -0.032533 \n", + "career_licenciatura en terapia ocupacional 1.000000 \n", + "career_medicina -0.031670 \n", + "career_técnico para bioterios -0.030182 \n", + "\n", + " career_medicina \\\n", + "gender_female -0.007504 \n", + "gender_male 0.007504 \n", + "career_actuario -0.030023 \n", + "career_agronomía -0.027995 \n", + "career_arquitectura -0.025173 \n", + "career_bioquímica -0.028880 \n", + "career_ciencias veterinarias -0.030023 \n", + "career_contador público -0.033501 \n", + "career_diseño de imagen y sonido -0.032202 \n", + "career_diseño industrial -0.030581 \n", + "career_farmacia -0.032202 \n", + "career_ingeniería electrónica -0.029169 \n", + "career_ingeniería en informática -0.031129 \n", + "career_ingeniería mecánica -0.030581 \n", + "career_licenciatura en administración -0.032202 \n", + "career_licenciatura en artes -0.029456 \n", + "career_licenciatura en ciencia política -0.031670 \n", + "career_licenciatura en ciencia y tecnología de ... -0.029456 \n", + "career_licenciatura en ciencias ambientales -0.029456 \n", + "career_licenciatura en ciencias antropológicas -0.034758 \n", + "career_licenciatura en ciencias biológicas -0.031401 \n", + "career_licenciatura en ciencias de la computación -0.032466 \n", + "career_licenciatura en ciencias de la educación -0.030581 \n", + "career_licenciatura en ciencias geológicas -0.030856 \n", + "career_licenciatura en gestión de agroalimentos -0.031401 \n", + "career_licenciatura en kinesiología y fisiatría -0.031129 \n", + "career_licenciatura en musicoterapia -0.034009 \n", + "career_licenciatura en planificación y diseño d... 
-0.030581 \n", + "career_licenciatura en producción de bioimagenes -0.030856 \n", + "career_licenciatura en psicología -0.029456 \n", + "career_licenciatura en relaciones del trabajo -0.030856 \n", + "career_licenciatura en sociología -0.031129 \n", + "career_licenciatura en terapia ocupacional -0.031670 \n", + "career_medicina 1.000000 \n", + "career_técnico para bioterios -0.028880 \n", + "\n", + " career_técnico para bioterios \n", + "gender_female 0.028664 \n", + "gender_male -0.028664 \n", + "career_actuario -0.028613 \n", + "career_agronomía -0.026680 \n", + "career_arquitectura -0.023991 \n", + "career_bioquímica -0.027523 \n", + "career_ciencias veterinarias -0.028613 \n", + "career_contador público -0.031928 \n", + "career_diseño de imagen y sonido -0.030690 \n", + "career_diseño industrial -0.029144 \n", + "career_farmacia -0.030690 \n", + "career_ingeniería electrónica -0.027799 \n", + "career_ingeniería en informática -0.029667 \n", + "career_ingeniería mecánica -0.029144 \n", + "career_licenciatura en administración -0.030690 \n", + "career_licenciatura en artes -0.028073 \n", + "career_licenciatura en ciencia política -0.030182 \n", + "career_licenciatura en ciencia y tecnología de ... -0.028073 \n", + "career_licenciatura en ciencias ambientales -0.028073 \n", + "career_licenciatura en ciencias antropológicas -0.033126 \n", + "career_licenciatura en ciencias biológicas -0.029926 \n", + "career_licenciatura en ciencias de la computación -0.030941 \n", + "career_licenciatura en ciencias de la educación -0.029144 \n", + "career_licenciatura en ciencias geológicas -0.029407 \n", + "career_licenciatura en gestión de agroalimentos -0.029926 \n", + "career_licenciatura en kinesiología y fisiatría -0.029667 \n", + "career_licenciatura en musicoterapia -0.032411 \n", + "career_licenciatura en planificación y diseño d... 
-0.029144 \n", + "career_licenciatura en producción de bioimagenes -0.029407 \n", + "career_licenciatura en psicología -0.028073 \n", + "career_licenciatura en relaciones del trabajo -0.029407 \n", + "career_licenciatura en sociología -0.029667 \n", + "career_licenciatura en terapia ocupacional -0.030182 \n", + "career_medicina -0.028880 \n", + "career_técnico para bioterios 1.000000 \n", + "\n", + "[35 rows x 35 columns]" + ] + }, + "execution_count": 122, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "correlacion2 = dft2.corr()\n", + "# correlacion\n", + "correlacion2\n", + "# sns.heatmap(correlacion[0:5],xticklabels=correlacion.columns[0:5],yticklabels=correlacion.columns[0:5],annot=True)\n", + "# plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 123, + "id": "8753f7e0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
gender_femalegender_malecareer_actuariocareer_agronomíacareer_arquitecturacareer_bioquímicacareer_ciencias veterinariascareer_contador públicocareer_diseño de imagen y sonidocareer_diseño industrial...career_licenciatura en kinesiología y fisiatríacareer_licenciatura en musicoterapiacareer_licenciatura en planificación y diseño del paisajecareer_licenciatura en producción de bioimagenescareer_licenciatura en psicologíacareer_licenciatura en relaciones del trabajocareer_licenciatura en sociologíacareer_licenciatura en terapia ocupacionalcareer_medicinacareer_técnico para bioterios
gender_female1.000000-1.0000000.0647560.019895-0.0322130.0026160.027091-0.025293-0.0167910.007851...0.019595-0.0140090.0448690.022949-0.004099-0.0076410.0256630.001113-0.0075040.028664
gender_male-1.0000001.000000-0.064756-0.0198950.032213-0.002616-0.0270910.0252930.016791-0.007851...-0.0195950.014009-0.044869-0.0229490.0040990.007641-0.025663-0.0011130.007504-0.028664
career_actuario0.064756-0.0647561.000000-0.027736-0.024941-0.028613-0.029746-0.033192-0.031905-0.030298...-0.030842-0.033695-0.030298-0.030571-0.029184-0.030571-0.030842-0.031377-0.030023-0.028613
career_agronomía0.019895-0.019895-0.0277361.000000-0.023255-0.026680-0.027736-0.030949-0.029749-0.028251...-0.028758-0.031418-0.028251-0.028506-0.027212-0.028506-0.028758-0.029257-0.027995-0.026680
career_arquitectura-0.0322130.032213-0.024941-0.0232551.000000-0.023991-0.024941-0.027830-0.026751-0.025404...-0.025860-0.028252-0.025404-0.025633-0.024470-0.025633-0.025860-0.026308-0.025173-0.023991
\n", + "

5 rows × 35 columns

\n", + "
" + ], + "text/plain": [ + " gender_female gender_male career_actuario \\\n", + "gender_female 1.000000 -1.000000 0.064756 \n", + "gender_male -1.000000 1.000000 -0.064756 \n", + "career_actuario 0.064756 -0.064756 1.000000 \n", + "career_agronomía 0.019895 -0.019895 -0.027736 \n", + "career_arquitectura -0.032213 0.032213 -0.024941 \n", + "\n", + " career_agronomía career_arquitectura career_bioquímica \\\n", + "gender_female 0.019895 -0.032213 0.002616 \n", + "gender_male -0.019895 0.032213 -0.002616 \n", + "career_actuario -0.027736 -0.024941 -0.028613 \n", + "career_agronomía 1.000000 -0.023255 -0.026680 \n", + "career_arquitectura -0.023255 1.000000 -0.023991 \n", + "\n", + " career_ciencias veterinarias career_contador público \\\n", + "gender_female 0.027091 -0.025293 \n", + "gender_male -0.027091 0.025293 \n", + "career_actuario -0.029746 -0.033192 \n", + "career_agronomía -0.027736 -0.030949 \n", + "career_arquitectura -0.024941 -0.027830 \n", + "\n", + " career_diseño de imagen y sonido \\\n", + "gender_female -0.016791 \n", + "gender_male 0.016791 \n", + "career_actuario -0.031905 \n", + "career_agronomía -0.029749 \n", + "career_arquitectura -0.026751 \n", + "\n", + " career_diseño industrial ... \\\n", + "gender_female 0.007851 ... \n", + "gender_male -0.007851 ... \n", + "career_actuario -0.030298 ... \n", + "career_agronomía -0.028251 ... \n", + "career_arquitectura -0.025404 ... 
\n", + "\n", + " career_licenciatura en kinesiología y fisiatría \\\n", + "gender_female 0.019595 \n", + "gender_male -0.019595 \n", + "career_actuario -0.030842 \n", + "career_agronomía -0.028758 \n", + "career_arquitectura -0.025860 \n", + "\n", + " career_licenciatura en musicoterapia \\\n", + "gender_female -0.014009 \n", + "gender_male 0.014009 \n", + "career_actuario -0.033695 \n", + "career_agronomía -0.031418 \n", + "career_arquitectura -0.028252 \n", + "\n", + " career_licenciatura en planificación y diseño del paisaje \\\n", + "gender_female 0.044869 \n", + "gender_male -0.044869 \n", + "career_actuario -0.030298 \n", + "career_agronomía -0.028251 \n", + "career_arquitectura -0.025404 \n", + "\n", + " career_licenciatura en producción de bioimagenes \\\n", + "gender_female 0.022949 \n", + "gender_male -0.022949 \n", + "career_actuario -0.030571 \n", + "career_agronomía -0.028506 \n", + "career_arquitectura -0.025633 \n", + "\n", + " career_licenciatura en psicología \\\n", + "gender_female -0.004099 \n", + "gender_male 0.004099 \n", + "career_actuario -0.029184 \n", + "career_agronomía -0.027212 \n", + "career_arquitectura -0.024470 \n", + "\n", + " career_licenciatura en relaciones del trabajo \\\n", + "gender_female -0.007641 \n", + "gender_male 0.007641 \n", + "career_actuario -0.030571 \n", + "career_agronomía -0.028506 \n", + "career_arquitectura -0.025633 \n", + "\n", + " career_licenciatura en sociología \\\n", + "gender_female 0.025663 \n", + "gender_male -0.025663 \n", + "career_actuario -0.030842 \n", + "career_agronomía -0.028758 \n", + "career_arquitectura -0.025860 \n", + "\n", + " career_licenciatura en terapia ocupacional \\\n", + "gender_female 0.001113 \n", + "gender_male -0.001113 \n", + "career_actuario -0.031377 \n", + "career_agronomía -0.029257 \n", + "career_arquitectura -0.026308 \n", + "\n", + " career_medicina career_técnico para bioterios \n", + "gender_female -0.007504 0.028664 \n", + "gender_male 0.007504 -0.028664 \n", + 
"career_actuario -0.030023 -0.028613 \n", + "career_agronomía -0.027995 -0.026680 \n", + "career_arquitectura -0.025173 -0.023991 \n", + "\n", + "[5 rows x 35 columns]" + ] + }, + "execution_count": 123, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "correlacion2[0:5]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "72cf1ae3", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "80dbff0e", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "47b32000", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b8ee6911", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "69744bbb", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d8f63f8d", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 124, + "id": "c2d2937a", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAmoAAAFlCAYAAABbbMQ3AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAgWklEQVR4nO3deZxkVX338c8XBmRxAWQkwIyOEQTRuI6IcYkRo6JRjAHjFlGJxESjxrglUSEaH/XRxGgSNSgIuKCEqKBxCQIaDREzKC5ADBMQBxhklGERHhT09/xxT0PRdE83w3TXme7P+/Wq19x7z61Tv7pV0/3tc+6tSlUhSZKk/mwx7gIkSZI0NYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMatI8SnJOksds5H3vnuSnSbbctFVBkkqyx6budy4lOSLJR8Zdx1Ruz+t8Ox7z/UnesIH2jX6Nk/wgyeNmue/zk3xtlvsek+SvN6amDfQ5J++LJI9JcvGm7leayZJxFyCNS5IfAH9QVV+ar8esqvvOdt/J9VXVD4E7zlFp2oRuy+u8CR/zxfP9mJLmniNq0jxI4h9Fnchgs/vZ53to8zUXo+BaPDa7H1bSXJiYrknyziTrk1yY5IBJ7Rckuaa1PWek7UVJzmtt5yZ5cNv+gySvTfId4NokS0ankNoUzYlJPtHu+80kD2htHwbuDnymTXe+JsmKNn21pO2zW5KTk1yRZHWSF43UdESSE5Ic1/o+J8nKGQ7Dk9pz/HGSdyTZIsnWrf9fG+n7bkmuS7J0iuO4ZZK/aX1cmOSlk2q+S5KjkqxNckmSv574JTaL1+CeSb7Sns8pwM6THnu/JGckuTLJt0enHpN8OclbkvwHcB3wqxs6EFNNc03x2k17fCf2ba/R/0uy00jbg9rx2aqtv7C9f9Yn+WKSe4zsW0lekuR84PwWMt+V5PIkVyf5bpL7tX1vMY2Y5NXtOF+a5IWTnsuTk3yr9bEmyRGT2n8/yUVJfpLkL2c4Vndt78Ork3wDuNek9r2TnNLeR99P8owN9Tdyvz3a631VO16fGGl7d6v76iRnJXnUNH18PslLJ237dpKnz9RPkm3bMV2f5FzgoZP6uU97X13ZXv+njrQdk+R9ST6X5FrgN2fznKUpVZU3b4vyBvwAeFxbfj5wA/AiYEvgj4BLgQDbA1cDe7V9dwXu25YPBi5h+CEeYA/gHiP9nw0sB7ad4jGPaI95ELAV8CrgQmCryfu29RVAAUva+r8D7wW2AR4IrAMeO9L39cCT2vN5K/D1DRyLAk4HdmIIiP/DMO1Ke4y3j+z7cuAz0/TzYuBcYBmwI/ClSTV/CvindkzvBnwD+MOZXoPW/p/A3wJ3AB4NXAN8pLXtDvykPd8tgN9q60tb+5eBHwL3ZTjlYyvgs8DrpnkejwEu3sD7ZYPHd9K+pwEvGml7B/D+tnwgsBq4T6vr9cAZk16XU9rrsi3wBOAsYAeG99t9gF3bvscAf92Wnwj8CLhfO9Yfa33tMfL8fq0dq/u3fZ/W2vYBftqO8R3aMb+RkffipOPyceCE9jj3Y/j/8LXWtj2wBnhBe34PAn4M7DO55in6PR74y1bjNsAjR9qeC9y19flnwGXANiOvzcT74nnAf4zcbx/gSuAOs+jnbcBX27FfDnxv4j3B8P5ZDfwFsDXwWIb3414jz+sq4BET9Y/75523zfc29gK8eRvXjVsHtdUjbdu1X2y/0n7ZXAn8Li1wjez3ReDlG+j/hRt4zCO45S/3LYC1wKMm79vWV7SalrRfHL8A7jTS/lbgmJG+vzTStg/w/zZwLAp44sj6HwOntuWHMYScicC0CnjGNP2cRgtebf1xIzXvA
vxs9BgCzwJOn8VrcHeGsLD9SPvHuPkX8muBD0/x2hzSlr8MvOk2vDcew8xBbdrjO2nfPwBOa8thCC6PbuufBw6d9B64jpvDftHCd1t/LEOI3g/YYlJ9x3BzUDsaeNtI270ZCWpTPN+/A97Vlt8IfHykbXvg50wR1BhC6g3A3iPb/g83B7XfA7466T7/BBw+ueYp+j4OOBJYNovXaz3wgJHXZuJ9cSfg2pHj+Rbg6Fn2cwG3/D9xGDcHtUcxhLotRtqPB44YeV7Hzfb95s3bhm5OfUo3u2xioaqua4t3rKprGX7hvBhYm+Rfk+zd2pcD/7uBPtfM8Jg3tVfVL4GLgd1mUetuwBVVdc3ItosYRpYmXDayfB2wTTZ8ntNorRdN1FFVZ7b7P6Y97z2AkzdQ12g/o8v3YBiJWNumi65k+KV9t6lqHn0NWr/r22sxWuNo3wdP9Nv6fiTD6OdUtWwKsz2+/wI8PMmuDKNUv2QYqZmo+90jNV/BEOZGX8fR98hpwD8A/whcnuTIJHee4jEnvw6jx4okD0tyepJ1Sa5ieG/vPNV92zH/yRSPAbCUIYRP91j3AB426XV5DkP4nslrGI7FN9rU4k3Tt0le1aaLr2p93oVJU+Gt9muAfwWe2TY9C/joLPvZ0DHcDVjT/s+Otk/5ukm3h0FNmoWq+mJV/RbDL/7/Bj7QmtYw6ZycyXedoevlEwsZTnBfxjDdN9N9LwV2SnKnkW13Z5h22ljLR5bvPlIHwLEM00S/D5xYVddP08dahucwVZ9rGEbUdq6qHdrtzjW7KyTXAjsm2X5SjaN9f3ik3x2qavuqetvIPjO9FqOuZRjRA246GfxW5+TNRlWtB/6NIew/m2G0aqKWNQwjkKN1b1tVZ0xXd1W9p6oewjCKd2/g1VM87Fpu/XqO+hhD2F5eVXcB3s8Qim513yTbMUwPTmUdw0jndI+1BvjKpOd3x6r6o2n6u0lVXVZVL6qq3YA/BN7bzlt7FEOIewawY1XtwDDNmGm6Oh54VpKHM0yhnt6e10z9bOgYXgoszy0vSpn8/++2vN+kaRnUpBkk2SXJgS0k/Izh/J2Jv6Q/CLwqyUPaid57ZORk8Fl4SJKnt5GYV7T+v97afsQ0J71X1RrgDOCtSbZJcn/gUOD2fH7Uq5PsmGQ5w3lonxhp+wjwOwxh7bgN9HEC8PIkuyfZgWFKcqLmtQyB5W+S3DnDxQr3SvIbMxVWVRcxTLn+VYYLHB4JPGVSfU9J8oQMFzRsk+GCgGVTdjiz/2EYIXtyhpP+X89wvtbG+hjD+VIHteUJ7wf+PMl94aaLLQ6erpMkD22jYVsxhMnrufm9OOoE4PlJ9mlB6/BJ7XdiGJG9Psm+DAFywonAbyd5ZJKtgTcxze+KqvoF8EngiCTbJdkHOGRkl88C985wccJW7fbQJPeZ7jmOPNeDR16/9QzB55et9hsZQuKSJG8EphpVnPA5hpG9NwGfGBkFm6mfExhemx1bHX8y0jYxyvya9pwew/B+/PhMz0u6rQxq0sy2AF7J8Ff0FcBvMJzoTlX9M8N5Lx9jOJn40wwnH8/WSQwjLesZRqueXlU3tLa3Aq9vU0avmuK+z2I4b+1ShpP0D6/b95lwJzGcqH42w3TRURMNLRh+k+GX5VenunPzAYYw9h3gWwy/JG9kOJ8OhrCyNcMFB+sZQsGut+5mSs9mOF/uCobgcVNgbPUdyHBy9zqGkZxXs4GfcRmuCPyLqdqq6iqG8/Q+yDBKci3DtPTGOhnYE7isqr498jifAt4OfDzJ1QwnrB8wdRfAECQ+wHDsLmKYknzHFPV/nuG8s9MYTno/bdIufwy8Kck1DOeknTBy33OAlzC8p9e2x9rQc38pw/T0ZQznZn1opK9rgMczTD1e2vZ5O7MLvQ8FzkzyU4bj9/KquoDh3MMvMITpixjC6rTTjFX1M4Yw+ThuGZJn6uev2vYLGd7THx7p8+cMwewAhosj3gs8r6r+exbPS7pNJ
k4OljTPMnwkwh5V9dxx1zIbSY4GLq2q19+G+xzAcIXjbRlllCQ1foCipBklWQE8neHjFTa037YMnxn1bwxXeR7OMNonSdoITn1K2qAkb2aYkntHVV040+4MU0brGaY+z2OYWpMkbQSnPiVJkjrliJokSVKnDGqSJEmdWpAXE+y88861YsWKcZchSZI0o7POOuvHVTXlh2ovyKC2YsUKVq1aNe4yJEmSZpTkounanPqUJEnqlEFNkiSpUwY1SZKkThnUJEmSOmVQkyRJ6tScBbUkRye5PMn3RrbtlOSUJOe3f3ds25PkPUlWJ/lOkgeP3OeQtv/5SQ6Zq3olSZJ6M5cjascAT5y07XXAqVW1J3BqWwc4ANiz3Q4D3gdDsGP4UueHAfsCh0+EO0mSpIVuzoJaVf07cMWkzQcCx7blY4GnjWw/rgZfB3ZIsivwBOCUqrqiqtYDp3Dr8CdJkrQgzfc5artU1dq2fBmwS1veHVgzst/Fbdt02yVJkha8sV1MUFUF1KbqL8lhSVYlWbVu3bpN1a0kSdLYzPdXSP0oya5VtbZNbV7etl8CLB/Zb1nbdgnwmEnbvzxVx1V1JHAkwMqVKzdZAJyNh7z6uPl8OEnNWe943rhLkKQ5Nd8jaicDE1duHgKcNLL9ee3qz/2Aq9oU6ReBxyfZsV1E8Pi2TZIkacGbsxG1JMczjIbtnORihqs33wackORQ4CLgGW33zwFPAlYD1wEvAKiqK5K8Gfivtt+bqmryBQqSJEkL0pwFtap61jRN+0+xbwEvmaafo4GjN2FpkiRJmwW/mUCSJKlTBjVJkqROGdQkSZI6ZVCTJEnqlEFNkiSpUwY1SZKkThnUJEmSOmVQkyRJ6pRBTZIkqVMGNUmSpE4Z1CRJkjplUJMkSeqUQU2SJKlTBjVJkqROGdQkSZI6ZVCTJEnqlEFNkiSpUwY1SZKkTi0ZdwGSpKn98E2/Nu4SpEXp7m/87rhLuIkjapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqfGEtSS/GmSc5J8L8nxSbZJcs8kZyZZneQTSbZu+96hra9u7SvGUbMkSdJ8m/eglmR34GXAyqq6H7Al8Ezg7cC7qmoPYD1waLvLocD6tv1dbT9JkqQFb1xTn0uAbZMsAbYD1gKPBU5s7ccCT2vLB7Z1Wvv+STJ/pUqSJI3HvAe1qroEeCfwQ4aAdhVwFnBlVd3YdrsY2L0t7w6safe9se1/1/msWZIkaRzGMfW5I8Mo2T2B3YDtgSdugn4PS7Iqyap169bd3u4kSZLGbhxTn48DLqyqdVV1A/BJ4BHADm0qFGAZcElbvgRYDtDa7wL8ZHKnVXVkVa2sqpVLly6d6+cgSZI058YR1H4I7Jdku3au2f7AucDpwEFtn0OAk9ryyW2d1n5aVdU81itJkjQW4zhH7UyGiwK+CXy31XAk8FrglUlWM5yDdlS7y1HAXdv2VwKvm++aJUmSxmHJzLtselV1OHD4pM0XAPtOse/1wMHzUZckSVJP/GYCSZKkThnUJEmSOmVQkyRJ6pRBTZIkqVMGNUmSpE4Z1CRJkjplUJMkSeqUQU2SJKlTBjVJkqROGdQkSZI6ZVCTJEnqlEFNkiSpUwY1SZKkThnUJEmSOmVQkyRJ6pRBTZIkqVMGNUmSpE4Z1CRJkjplUJMkSeqUQU2SJKlTBjVJkqROGdQkSZI6ZVCTJEnqlEFNkiSpUwY1SZKkThnUJEmSOmVQkyRJ6pRBTZIkqVMGNUmSpE4Z1CRJkjplUJMkSeqUQU2SJKlTBjVJkqROGdQkSZI6ZVCTJEnqlEFNkiSpUwY1SZKkThnUJEmSO
mVQkyRJ6pRBTZIkqVMGNUmSpE4Z1CRJkjplUJMkSeqUQU2SJKlTYwlqSXZIcmKS/05yXpKHJ9kpySlJzm//7tj2TZL3JFmd5DtJHjyOmiVJkubbuEbU3g18oar2Bh4AnAe8Dji1qvYETm3rAAcAe7bbYcD75r9cSZKk+TfvQS3JXYBHA0cBVNXPq+pK4EDg2LbbscDT2vKBwHE1+DqwQ5Jd57VoSZKkMRjHiNo9gXXAh5J8K8kHk2wP7FJVa9s+lwG7tOXdgTUj97+4bbuFJIclWZVk1bp16+awfEmSpPkxjqC2BHgw8L6qehBwLTdPcwJQVQXUbem0qo6sqpVVtXLp0qWbrFhJkqRxGUdQuxi4uKrObOsnMgS3H01MabZ/L2/tlwDLR+6/rG2TJEla0OY9qFXVZcCaJHu1TfsD5wInA4e0bYcAJ7Xlk4Hntas/9wOuGpkilSRJWrCWjOlx/wT4aJKtgQuAFzCExhOSHApcBDyj7fs54EnAauC6tq8kSdKCN5agVlVnAyunaNp/in0LeMlc1yRJktQbv5lAkiSpUwY1SZKkThnUJEmSOjWroJbk1NlskyRJ0qazwYsJkmwDbAfs3L4kPa3pzkzx7QCSJEnadGa66vMPgVcAuwFncXNQuxr4h7krS5IkSRsMalX1buDdSf6kqv5+nmqSJEkSs/wctar6+yS/DqwYvU9VHTdHdUmSJC16swpqST4M3As4G/hF21yAQU2SJGmOzPabCVYC+7RvCZAkSdI8mO3nqH0P+JW5LESSJEm3NNsRtZ2Bc5N8A/jZxMaqeuqcVCVJkqRZB7Uj5rIISZIk3dpsr/r8ylwXIkmSpFua7VWf1zBc5QmwNbAVcG1V3XmuCpMkSVrsZjuidqeJ5SQBDgT2m6uiJEmSNPurPm9Sg08DT9j05UiSJGnCbKc+nz6yugXD56pdPycVSZIkCZj9VZ9PGVm+EfgBw/SnJEmS5shsz1F7wVwXIkmSpFua1TlqSZYl+VSSy9vtX5Ism+viJEmSFrPZXkzwIeBkYLd2+0zbJkmSpDky26C2tKo+VFU3ttsxwNI5rEuSJGnRm21Q+0mS5ybZst2eC/xkLguTJEla7GYb1F4IPAO4DFgLHAQ8f45qkiRJErP/eI43AYdU1XqAJDsB72QIcJIkSZoDsx1Ru/9ESAOoqiuAB81NSZIkSYLZB7Utkuw4sdJG1GY7GidJkqSNMNuw9TfAfyb557Z+MPCWuSlJkiRJMPtvJjguySrgsW3T06vq3LkrS5IkSbOevmzBzHAmSZI0T2Z7jpokSZLmmUFNkiSpUwY1SZKkThnUJEmSOmVQkyRJ6pRBTZIkqVMGNUmSpE4Z1CRJkjplUJMkSeqUQU2SJKlTBjVJkqROGdQkSZI6NbaglmTLJN9K8tm2fs8kZyZZneQTSbZu2+/Q1le39hXjqlmSJGk+jXNE7eXAeSPrbwfeVVV7AOuBQ9v2Q4H1bfu72n6SJEkL3liCWpJlwJOBD7b1AI8FTmy7HAs8rS0f2NZp7fu3/SVJkha0cY2o/R3wGuCXbf2uwJVVdWNbvxjYvS3vDqwBaO1Xtf1vIclhSVYlWbVu3bo5LF2SJGl+zHtQS/LbwOVVddam7LeqjqyqlVW1cunSpZuya0mSpLFYMobHfATw1CRPArYB7gy8G9ghyZI2arYMuKTtfwmwHLg4yRLgLsBP5r9sSZKk+TXvI2pV9edVtayqVgDPBE6rqucApwMHtd0OAU5qyye3dVr7aVVV81iyJEnSWPT0OWqvBV6ZZDXDOWhHte1HAXdt218JvG5M9UmSJM2rcUx93qSqvgx8uS1fAOw7xT7XAwfPa2GSJEkd6GlETZIkSSMMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJ
EmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1at6DWpLlSU5Pcm6Sc5K8vG3fKckpSc5v/+7YtifJe5KsTvKdJA+e75olSZLGYRwjajcCf1ZV+wD7AS9Jsg/wOuDUqtoTOLWtAxwA7NluhwHvm/+SJUmS5t+8B7WqWltV32zL1wDnAbsDBwLHtt2OBZ7Wlg8EjqvB14Edkuw6v1VLkiTNv7Geo5ZkBfAg4Exgl6pa25ouA3Zpy7sDa0budnHbNrmvw5KsSrJq3bp1c1e0JEnSPBlbUEtyR+BfgFdU1dWjbVVVQN2W/qrqyKpaWVUrly5dugkrlSRJGo+xBLUkWzGEtI9W1Sfb5h9NTGm2fy9v2y8Blo/cfVnbJkmStKCN46rPAEcB51XV3440nQwc0pYPAU4a2f68dvXnfsBVI1OkkiRJC9aSMTzmI4DfB76b5Oy27S+AtwEnJDkUuAh4Rmv7HPAkYDVwHfCCea1WkiRpTOY9qFXV14BM07z/FPsX8JI5LUqSJKlDfjOBJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUKYOaJElSpwxqkiRJnTKoSZIkdcqgJkmS1CmDmiRJUqcMapIkSZ0yqEmSJHVqswlqSZ6Y5PtJVid53bjrkSRJmmubRVBLsiXwj8ABwD7As5LsM96qJEmS5tZmEdSAfYHVVXVBVf0c+Dhw4JhrkiRJmlNLxl3ALO0OrBlZvxh42OgOSQ4DDmurP03y/XmqTZu/nYEfj7sI3XZ55yHjLkHaEH+2bK4Oz3w/4j2ma9hcgtqMqupI4Mhx16HNT5JVVbVy3HVIWlj82aJNYXOZ+rwEWD6yvqxtkyRJWrA2l6D2X8CeSe6ZZGvgmcDJY65JkiRpTm0WU59VdWOSlwJfBLYEjq6qc8ZclhYOp8wlzQV/tuh2S1WNuwZJkiRNYXOZ+pQkSVp0DGqSJEmdMqhJkiR1yqAmSZLUKYOaFp0k905yapLvtfX7J3n9uOuStDAk2TbJXuOuQwuDQU2L0QeAPwduAKiq7zB8Np8k3S5JngKcDXyhrT8wiZ/7qY1mUNNitF1VfWPSthvHUomkheYIYF/gSoCqOhu45/jK0ebOoKbF6MdJ7gUUQJKDgLXjLUnSAnFDVV01aZsfWKqNtll8M4G0ib2E4RPD905yCXAh8NzxliRpgTgnybOBLZPsCbwMOGPMNWkz5jcTaNFKsj2wRVVdM+5aJC0MSbYD/hJ4PBCGrz58c1VdP9bCtNkyqGnRSPLKDbVX1d/OVy2SJM2GU59aTO407gIkLUxJPsMGzkWrqqfOYzlaQBxRkyTpdkryGxtqr6qvzFctWlgMalp0kmwDHArcF9hmYntVvXBsRUmSNAU/nkOL0YeBXwGeAHwFWAZ4QYGk2y3JnklOTHJukgsmbuOuS5svg5oWoz2q6g3AtVV1LPBk4GFjrknSwvAh4H0MH6L9m8BxwEfGWpE2awY1LUY3tH+vTHI/4C7A3cZYj6SFY9uqOpXh1KKLquoIhj8GpY3iVZ9ajI5MsiPwBuBk4I7AG8dbkqQF4mdJtgDOT/JS4
BKGnzHSRvFiAkmSNpEkDwXOA3YA3gzcGfi/VXXmOOvS5sugpkUnyQ7A84AVjIwqV9XLxlSSpAUiyUqGbya4B7BV21xVdf/xVaXNmVOfWow+B3wd+C7wyzHXImlh+Sjwavz5ok3EoKbFaJuq2uDXSUnSRlpXVSePuwgtHE59atFJ8qfAT4HPAj+b2F5VV4ytKEkLQpL9gWcBp3LLny+fHFtR2qw5oqbF6OfAOxjOI5n4S6WAXx1bRZIWihcAezOcnzYx9VmAQU0bxRE1LTrtU8L3raofj7sWSQtLku9X1V7jrkMLhx94q8VoNXDduIuQtCCdkWSfcRehhcOpTy1G1wJnJzmdW55D4sdzSLq99mP4+XIhw8+X4Mdz6HYwqGkx+nS7SdKm9sRxF6CFxXPUtCgl2Ra4e1V9f9y1SJI0Hc9R06KT5CnA2cAX2voDk/i5R5Kk7hjUtBgdAewLXAlQVWfjR3NIkjpkUNNidENVXTVpm1/1IknqjhcTaDE6J8mzgS2T7Am8DDhjzDVJknQrjqhp0Ujy4bb4v8B9GS6dPx64GnjFmMqSJGlaXvWpRSPJucDjgM8Dvzm53e/6lCT1xqlPLSbvZ/ii5F8FVo1sD37XpySpQ46oadFJ8r6q+qNx1yFJ0kwMapIkSZ3yYgJJkqROGdQkSZI6ZVCTpNshyTFJDhp3HZIWJoOaJM2jJF5tL2nWDGqSFo0kb0jy/SRfS3J8klcluVeSLyQ5K8lXk+zd9j0myXuSnJHkgolRswz+ofXzJeBuI/0/JMlXWl9fTLJr2/7lJH+XZBXw8nE8d0mbJ/+yk7QoJHko8LvAA4CtgG8CZwFHAi+uqvOTPAx4L/DYdrddgUcCewMnAycCvwPsBewD7AKcCxydZCvg74EDq2pdkt8D3gK8sPW1dVWtnPMnKmlBMahJWiweAZxUVdcD1yf5DLAN8OvAPyeZ2O8OI/f5dFX9Ejg3yS5t26OB46vqF8ClSU5r2/cC7gec0vraElg70tcn5uA5SVrgDGqSFrMtgCur6oHTtP9sZDnT7DPafk5VPXya9mtvY22S5DlqkhaN/wCekmSbJHcEfhu4DrgwycFw0/lnD5ihn38Hfi/Jlu0ctInvjf0+sDTJw1tfWyW575w8E0mLhkFN0qJQVf/FcJ7Zd4DPA98FrgKeAxya5NvAOcCBM3T1KeB8hnPTjgP+s/X/c+Ag4O2tr7MZplUlaaP5FVKSFo0kd6yqnybZjmFk7LCq+ua465Kk6XiOmqTF5Mgk+zBcRHCsIU1S7xxRkyRJ6pTnqEmSJHXKoCZJktQpg5okSVKnDGqSJEmdMqhJkiR1yqAmSZLUqf8PH3Hxbk0QMioAAAAASUVORK5CYII=", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafBar(df1.gender,df1.university[0])\n", + "grafBar(df2.gender,df2.university[0])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0c6f8bdf", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 125, + "id": "b3e4945a", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafBox(df1.gender,df1.age,df1.university[0])\n", + "grafBox(df2.gender,df2.age,df2.university[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 126, + "id": "a0cc728f", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "grafPie(df1,df1.gender,df1.university[0])\n", + "grafPie(df2,df2.gender,df2.university[0])\n", + "\n", + "\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 127, + "id": "813821c4", + "metadata": {}, + "outputs": [], + "source": [ + "# total_precio = df2.groupby(df2.gender).count()\n", + "# print(total_precio)\n", + "# # etiquetas = dfg.unique()\n", + "# # l=list(total_precio['university'].index.sort_values())\n", + "# label =total_precio['age'].sort_values()\n", + "\n", + "# label.index\n", + "# total_precio.age\n", + "# # total_precio['age'].index\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "efd7743e", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0777de8d", + "metadata": {}, + "outputs": [], + "source": [ + "total_precio = df1.groupby(df1.gender).count()\n", + "\n", + "colors = sns.color_palette('pastel')[0:6]\n", + "# plt.pie(total_precio.columns[0],labels=total_precio.index, colors = colors,\n", + "# autopct='%.0f%%')\n", + "# # plt.title(f\"Inscription by {dfg.name}: {location}\")\n", + "# plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4904292f", + "metadata": {}, + "outputs": [], + "source": [ + "total_precio.columns[0]\n" + ] + }, + { + "cell_type": "code", + "execution_count": 129, + "id": "84b7fd47", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array(['male', 'female'], dtype=object)" + ] + }, + "execution_count": 129, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "904/len(df1)*100\n", + "\n", + "df1.gender.unique()" + ] + }, + { + "cell_type": "code", + "execution_count": 130, + "id": "b70b601c", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "grafPie(df1,df1.inscmonth,df1.university[0])\n", + "grafPie(df2,df2.inscmonth,df2.university[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 131, + "id": "a64ec8bc", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "grafPie(df1,df1.age,df1.university[0])\n", + "grafPie(df2,df2.age,df2.university[0])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ce384c4f", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cb71a7d7", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 132, + "id": "25379fb1", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafBox(df1.career,df1.age,df1.university[0])\n", + "grafBox(df2.career,df2.age,df2.university[0])\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "88cf4a7a", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 133, + "id": "4aa8f82a", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafBar(df1.career,df1.university[0])\n", + "grafBar(df2.career,df2.university[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 134, + "id": "67043e5b", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafBar(df1.age,df1.university[0])\n", + "grafBar(df2.age,df2.university[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 135, + "id": "ae52cfc5", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "graf3Rel(df1,df1.career,df1.age,df1.gender)\n", + "graf3Rel(df2,df2.career,df2.age,df2.gender)" + ] + }, + { + "cell_type": "code", + "execution_count": 136, + "id": "db6b1704", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafLocation(df1)\n", + "\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 137, + "id": "8f18aebc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'univ. nacional del comahue'" + ] + }, + "execution_count": 137, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df1.university.unique()[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 138, + "id": "ec149ead", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAmEAAAH+CAYAAADULdlAAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAABKvklEQVR4nO3dd5hkVbX+8e/LACLCEGTwShhABRElOgSBewXTFQMYMKAYUAETQcT006uI14gZMyKKGADjqAgSRUCUGUAyXgSVKIIkyeH9/XF2DzXd1T2DzqldU+f9PE893eec6ppV1T3dq/Zeey/ZJiIiIiIGa4naAURERER0UZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWMQIkXShpO3+xa+dKemfkqYt2qhAkiU9blE/bgyGpNdKOm2A/15+XqITkoRFtETSnyU9Y5D/pu0n2j5lYe47Pj7bf7W9nO37WwswIiLmSRIWMQIkLVk7hsXJony98tpPTo38nYmYRP5zRAzA2HSOpE9KuknSFZJ2GHf9ckm3lWuv7Lm2u6SLy7WLJG1Wzv9Z0rsknQfcLmnJ3tEtSQdI+oGkI8vXni1p43Lt28BM4GdlCvKdktYu00BLlvusJmm2pH9IukzS7j0xHSDpKEmHl8e+UNKsBbwMzynP8QZJB0laQtLS5fE37HnsVSXdIWnGJK/lZK/HuyX9qef8C8e9vqdL+oykG4EDJD2sfD/+Kulvkr4i6eE9X/M8SedKulnSGZI26rk24bWf6olLWknSzyX9vXz/fy5pjZ7r60g6tcR+gqQvSjqiXNtO0lXjHq/3+7yFpN+WOK+V9AVJS08Ry7bl+dws6UpJry3nVyjfz79L+ouk902WQEnaWtJZkm4pH7fuuXaKpA9LOh24A3iMpN16vmeXS9pz3OO9o8R+jaTXjbv2XEnnSLq1xHvAVK91xGLFdm655dbCDfgz8Izy+WuBe4HdgWnAm4BrAAGPAG4FHl/u+2jgieXzlwBXA5uX+z4OWKvn8c8F1gQe3uffPKD8mzsDSwH7A1cAS42/bzleGzCwZDk+FfgSsAywCfB34Gk9j30X8JzyfD4KnDnFa2HgZGBlmuTvj8AbyrUvAR/vue8+wM8meZypXo+XAKvRvLl8GXA78Oie1/8+YC9gSeDhwGeA2SWm5YGfAR8t998UuB7Ysjy/15TX62FTvPbnAa+YJO5HAi8Gli3/1tHAT3qu/xb4JLA0sG35eTiiXNsOuGqKn60nA1uV57U2cDGw7yRxrAXcBuxSfiYeCWxSrh0O/LTEt3b5Hr2+5/U7rXy+MnAT8Kryb+5Sjh9Zrp8C/BV4Yrm+FPBc4LHle/ZUmuRss3L/ZwN/A55E83/huzQ/L4/ref4blu/rRuW+L6j9/zu33BbFrXoAueU2qjcmJmGX9Vxbtvyh+Y/yh+fm8kf64eMe4zhgnyke/3VT/JsH0JMYlT9i1wL/Of6+5XjtEtOSNMnF/cDyPdc/Cnyz57FP6Lm2AXDnFK+FgWf3HL8ZOLF8vmX5o61yPAd46SSPM+nr0ee+5wI79bz+f+25Jpok7bE9554CXFE+/zLwoXGPdynw1Mle+4f4s7EJcFP5fCZNgrhsz/UjWMgkrM9j7wv8eJJr7+l3jSbRvAfYoOfcnsApPa/fWBL2KuD3477+t8Bry+enAAcu4Pn/ZOz7CHwD+FjPtfXoScL6fO1ngc/8q699brkN0y3TkRGDc93YJ7bvKJ8uZ/t2mpGbNwLXSvqFpPXL9TWBP03xmFcu4N+cd932A8BVNKNFC7Ia8A/bt/Wc+wuwes/xdT2f3wEss4Bpud5Y/zIWh+3fla/frjzvx9GMUPUz6
esh6dU904c304ysrDLJvz+DJhGe23P/Y8t5aEaM3j52rVxfk/lfuwW99r2xLSvpq2Wa71aaUcYV1axEHXut7+j5kofy2OuV6c3rymN/hPmfd6/JXr9VaEas/tJzbvz3e8xq4+7X777zxS9pB0lnlqnnm2lGUMdiXI2JPxu9X7ulpJPLNOktNP9PJnt+EYuVJGERQ8D2cbafSTMVeQlwSLl0Jc00zqRfuoCHXnPsk1LfswbNNOiCvvYaYGVJy/ecm0kzFfivWrPn85k9cQB8C9iVZpTlB7bvmuQx+r4ektaiec3eSjMttiJwAc2I15je53sDcCfNtO+K5baC7eV6/p0P91xb0faytr83yeMtyNuBxwNb2p4O/NdY6DSjkytLWrbn/r2v1e00CePYc53Gg8kiNKN2lwDrlsf+f+Oed6/Jfp5uoJm6Xqvn3GTf72vG3a/ffee9NpIeBvyQZrr1UeV7c0xPjNcy8Wej13dpkvI1ba8AfIXJn1/EYiVJWERlkh4laSdJjwDuBv4JPFAufx3YX9KT1XhcSTgW1pMlvaiMUO1bHv/Mcu1vwGP6fZHtK4EzgI9KWqYUpb+eZprsX/WOUqC+Jk3d15E9144AXkiTiB0+xWNM9no8guYP/98BJO1GMxLWVxkVPAT4jKRVy9esLum/y10OAd5YRmEk6RGlQHz5yR5zAZanSfpulrQy8IGeWP5CMwV7gJqFCk8Bnt/ztX+kGWV8rqSlgPcBDxv32LcC/ywjiW+aIo7vAM+Q9FI1CzkeKWkTN9uSHAV8WNLy5TXdj/7f72OA9SS9ojzGy2imo38+yb+5dIn378B9ahakPKvn+lHAayVtUBLRD4z7+uVpRgrvkrQF8Iopnl/EYiVJWER9S9D8wbsG+AdN4fKbAGwfDXyYZjTgNppampUfwmP/lGaqc6yQ+kW27y3XPgq8r0y37d/na3ehqRO7Bvgx8AHbJzyUJ9Ynlrk0tVq/AA4du1CSvrNpEqnfTPYAk70eti8CPkVTm/Q3mkLu0xcQz7uAy4AzyzTeCTSjVdieQ7OI4gs0r91lNHVRk1KzQvSVk1z+LM1igBtokuBjx11/JU1N2o3A/9IkqHeXWG6hqaH7Os1o0+0008pj9qdJTG6jSR57k9v52P4rzVTg22l+1s4FNi6X9yqPfTlwGs1r/I0+j3Ej8LzyGDcC7wSeZ/uGSf7N24C9aZKtm0qss3uu/5Lm9TmJ5nU+adxDvBk4UNJtwPvL40SMhLFC2IgYMWUp/+Ns71o7loUh6RvANbbfVzuW2iQdCVxie/yoUESMkGwyGBHVSVobeBHN1hCdI2lzmpGpK2im6nYCPlY1qIhoXaYjI6IqSR+iKaI/yPYVteOp5D9otnb4J/B54E22z6kaUUS0LtORERERERVkJCwiIiKigiRhERERERUsdoX5q6yyitdee+3aYUREREQs0Ny5c2+wPaPftcUuCVt77bWZM2dO7TAiIiIiFkjS+DZf82Q6MiIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiApaS8IkfUPS9ZIumOS6JH1e0mWSzpO0WVuxRERERAybNkfCvgk8e4rrOwDrltsewJdbjCUiIiJiqLSWhNk+FfjHFHfZCTjcjTOBFSU9uq14IiIiIoZJzZqw1YEre46vKuciIiIiRt5i0TtS0h40U5bMnDmz732e/I7DBxlSa+Ye9OqHdP+/HrhhS5EM1sz3n/+Q7r/Nwdu0FMlgnb7X6Q/p/r/+r6e2FMlgPfXUXz+k+3/h7T9rKZLBeuunnv+Q7v/hXXduKZLBeu8RP3hI97/4wye1FMlgPeG9T3tI9z/ggAPaCWTAHurzOOroLdoJZMBe+pLfP+SvqTkSdjWwZs/xGuXcBLa/ZnuW7VkzZvRtRB4RERGxWKmZhM0GXl1WSW4F3GL72orxRERERAxMa9ORkr4HbAesIukq4APAUgC2vwIcAzwHu
Ay4A9itrVgiIiIihk1rSZjtXRZw3cBb2vr3IyIiIoZZdsyPiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERUkCYuIiIioIElYRERERAVJwiIiIiIqSBIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERUkCYuIiIioIElYRERERAVJwiIiIiIqSBIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipoNQmT9GxJl0q6TNK7+1yfKelkSedIOk/Sc9qMJyIiImJYtJaESZoGfBHYAdgA2EXSBuPu9j7gKNubAi8HvtRWPBERERHDpM2RsC2Ay2xfbvse4PvATuPuY2B6+XwF4JoW44mIiIgYGku2+NirA1f2HF8FbDnuPgcAv5K0F/AI4BktxhMRERExNGoX5u8CfNP2GsBzgG9LmhCTpD0kzZE05+9///vAg4yIiIhY1NpMwq4G1uw5XqOc6/V64CgA278FlgFWGf9Atr9me5btWTNmzGgp3IiIiIjBaTMJOwtYV9I6kpamKbyfPe4+fwWeDiDpCTRJWIa6IiIiYuS1loTZvg94K3AccDHNKsgLJR0oacdyt7cDu0v6A/A94LW23VZMEREREcOizcJ8bB8DHDPu3Pt7Pr8I2KbNGCIiIiKGUe3C/IiIiIhOShIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERUkCYuIiIioIElYRERERAVJwiIiIiIqSBIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiIClpNwiQ9W9Klki6T9O5J7vNSSRdJulDSd9uMJyIiImJYLNnWA0uaBnwReCZwFXCWpNm2L+q5z7rAe4BtbN8kadW24omIiIgYJm2OhG0BXGb7ctv3AN8Hdhp3n92BL9q+CcD29S3GExERETE02kzCVgeu7Dm+qpzrtR6wnqTTJZ0p6dktxhMRERExNFqbjnwI//66wHbAGsCpkja0fXPvnSTtAewBMHPmzAGHGBEREbHotTkSdjWwZs/xGuVcr6uA2bbvtX0F8EeapGw+tr9me5btWTNmzGgt4IiIiIhBaTMJOwtYV9I6kpYGXg7MHnefn9CMgiFpFZrpyctbjCkiIiJiKLSWhNm+D3grcBxwMXCU7QslHShpx3K344AbJV0EnAy8w/aNbcUUERERMSxarQmzfQxwzLhz7+/53MB+5RYRERHRGdkxPyIiIqKCJGERERERFSxUEibpxIU5FxERERELZ8qaMEnLAMsCq0haCVC5NJ2JG69GRERExEJaUGH+nsC+wGrAXB5Mwm4FvtBeWBERERGjbcokzPbngM9J2sv2wQOKKSIiImLkLdQWFbYPlrQ1sHbv19g+vKW4IiIiIkbaQiVhkr4NPBY4F7i/nDaQJCwiIiLiX7Cwm7XOAjYom6tGRERExL9pYfcJuwD4jzYDiYiIiOiShR0JWwW4SNLvg
bvHTtrecfIviYiIiIjJLGwSdkCbQURERER0zcKujvx124FEREREdMnCro68jWY1JMDSwFLA7bantxVYRERExChb2JGw5cc+lyRgJ2CrtoKKiIiIGHULuzpyHjd+Avz3og8nIiIiohsWdjryRT2HS9DsG3ZXKxFFREREdMDCro58fs/n9wF/ppmSjIiIiIh/wcLWhO3WdiARERERXbJQNWGS1pD0Y0nXl9sPJa3RdnARERERo2phC/MPA2YDq5Xbz8q5iIiIiPgXLGwSNsP2YbbvK7dvAjNajCsiIiJipC1sEnajpF0lTSu3XYEb2wwsIiIiYpQtbBL2OuClwHXAtcDOwGtbiikiIiJi5C3sFhUHAq+xfROApJWBT9IkZxERERHxEC3sSNhGYwkYgO1/AJu2E1JERETE6FvYJGwJSSuNHZSRsIUdRYuIiIiIcRY2kfoU8FtJR5fjlwAfbiekiIiIiNG3sDvmHy5pDvC0cupFti9qL6yIiIiI0bbQU4ol6UriFREREbEILGxNWEREREQsQknCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiIClpNwiQ9W9Klki6T9O4p7vdiSZY0q814IiIiIoZFa0mYpGnAF4EdgA2AXSRt0Od+ywP7AL9rK5aIiIiIYdPmSNgWwGW2L7d9D/B9YKc+9/sQ8HHgrhZjiYiIiBgqbSZhqwNX9hxfVc7NI2kzYE3bv2gxjoiIiIihU60wX9ISwKeBty/EffeQNEfSnL///e/tBxcRERHRsjaTsKuBNXuO1yjnxiwPPAk4RdKfga2A2f2K821/zfYs27NmzJjRYsgRERERg9FmEnYWsK6kdSQtDbwcmD120fYttlexvbbttYEzgR1tz2kxpoiIiIih0FoSZvs+4K3AccDFwFG2L5R0oKQd2/p3IyIiIhYHS7b54LaPAY4Zd+79k9x3uzZjiYiIiBgm2TE/IiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERUkCYuIiIioIElYRERERAVJwiIiIiIqSBIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERUkCYuIiIioIElYRERERAVJwiIiIiIqSBIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKig1SRM0rMlXSrpMknv7nN9P0kXSTpP0omS1moznoiIiIhh0VoSJmka8EVgB2ADYBdJG4y72znALNsbAT8APtFWPBERERHDpM2RsC2Ay2xfbvse4PvATr13sH2y7TvK4ZnAGi3GExERETE02kzCVgeu7Dm+qpybzOuBX7YYT0RERMTQWLJ2AACSdgVmAU+d5PoewB4AM2fOHGBkEREREe1ocyTsamDNnuM1yrn5SHoG8F5gR9t393sg21+zPcv2rBkzZrQSbERERMQgtZmEnQWsK2kdSUsDLwdm995B0qbAV2kSsOtbjCUiIiJiqLSWhNm+D3grcBxwMXCU7QslHShpx3K3g4DlgKMlnStp9iQPFxERETFSWq0Js30McMy4c+/v+fwZbf77EREREcMqO+ZHREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhERE
VFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERUkCYuIiIioIElYRERERAVJwiIiIiIqSBIWERERUUGSsIiIiIgKkoRFREREVJAkLCIiIqKCJGERERERFSQJi4iIiKggSVhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqCBJWEREREQFScIiIiIiKkgSFhEREVFBkrCIiIiICpKERURERFSQJCwiIiKigiRhERERERW0moRJerakSyVdJundfa4/TNKR5frvJK3dZjwRERERw6K1JEzSNOCLwA7ABsAukjYYd7fXAzfZfhzwGeDjbcUTERERMUzaHAnbArjM9uW27wG+D+w07j47Ad8qn/8AeLoktRhTRERExFBoMwlbHbiy5/iqcq7vfWzfB9wCPLLFmCIiIiKGgmy388DSzsCzbb+hHL8K2NL2W3vuc0G5z1Xl+E/lPjeMe6w9gD3K4eOBS1sJesFWAW5Y4L1GT553t+R5d0ued7fkeQ/eWrZn9LuwZIv/6NXAmj3Ha5Rz/e5zlaQlgRWAG8c/kO2vAV9rKc6FJmmO7Vm14xi0PO9uyfPuljzvbsnzHi5tTkeeBawraR1JSwMvB2aPu89s4DXl852Bk9zW0FxERETEEGltJMz2fZLeChwHTAO+YftCSQcCc2zPBg4Fvi3pMuAfNIlaRERExMhrczoS28cAx4w79/6ez+8CXtJmDItY9SnRSvK8uyXPu1vyvLslz3uItFaYHxERERGTS9uiiIiIiAqShEVERERUkCQsIuaRtISk6bXjGARJj5C0RPl8PUk7SlqqdlzRDkn7SJquxqGSzpb0rNpxRTskPVbSw8rn20naW9KKlcOaIEnYQpC0qqSZY7fa8bRN0osk/Z+kWyTdKuk2SbfWjmtQJD1X0jslvX/sVjumNkn6bvnj9AjgAuAiSe+oHdcAnAosI2l14FfAq4BvVo1oACRtJeksSf+UdI+k+zvy//t1tm8FngWsRPP9/ljdkAZH0saS3lpuG9eOZwB+CNwv6XE0RflrAt+tG9JEScKmUN4Z/x9wBfBr4M/AL6sGNRifAHa0vYLt6baXt92V0ZGvAC8D9gJEs3p3rapBtW+D8sfpBTQ/3+vQ/IEadbJ9B/Ai4Eu2XwI8sXJMg/AFYBfg/4CHA28Avlg1osEY60v8HODbti/sOTfSJO0DfAdYtdyOkLRX3aha90Bph/hC4GDb7wAeXTmmCZKETe1DwFbAH22vAzwdOLNuSAPxN9sX1w6ikq1tvxq4yfYHgacA61WOqW1LlWm4FwCzbd8LdGHZtCQ9BXgl8ItyblrFeAbG9mXANNv32z4MeHbtmAZgrqRf0SRhx0laHnigckyD8nqaloDvL9tEbQXsXjmmtt0raReaDeF/Xs4NXblBq/uEjYB7bd9Y6mSWsH2ypM/WDmoA5kg6EvgJcPfYSds/qhbR4NxZPt4haTWaNlpD9+5pEfsqzSjvH4BTJa0FdGF6al/gPcCPy0bSjwFOrhvSQNxRupicK+kTwLV04w3564FNgMtt3yHpkcBudUMaGAH39xzfz+iPAu4GvBH4sO0rJK0DfLtyTBNkn7ApSDqBZnTgozTNP68HNre9dc242ibpsD6nbft1Aw9mwCT9D3AwzajnF2lGhL5u+3+qBjZgkpYsQ/kjT9KyZVqyE0qSfT3NqMDbaHr2fqmMjo00SSsB6wLLjJ2zfWq9iAZD0n40I0I/LqdeAHzT9mdrxTQIkh4OzLR9ae1YJpMkbAqlUPkumncMr6T5ZfUd2xOajMfiS9L6ti/pc/5hwDK2b6kQ1kBJei5NPVTvH6cD60XUvjIVeSiwnO2ZpVh5T9tvrhzaIifpjcD5tk+vHUstkt4A7AOsAZxLMyX3W9tPqxnXoEjaDNi2HP7G9jk142mbpOcDnwSWtr2OpE2AA23vWDey+SUJiwkkrUEzGrRNOfUbYB/bV
9WLqj2SdqIpRN8NeGa/+4zyVGxZjLAssD3wdWBn4Pe2X181sJZJ+h3Nc51te9Ny7gLbT6ob2aInaQXg88DRNCP7E37x295o0HENkqTzgc2BM21vIml94CO2X1Q5tNZImm77Vkkr97tu+x+DjmlQJM0FngacMsz/v1MT1oek02xvK+k25v9lJZppuZFbKVjeKf+mrBg6jGYp71hfz13Lub4JyuLO9k8lXU5TnPycfncBRjYJo1mMsJGk82x/UNKn6MYqYGxfKc1XGnP/ZPddnJXR3NdIWhV4Xu14KrnL9l2SkPQw25dIenztoFr2XZrv91z6/C0DHlMjqAG51/Yt4/5/D91CjCRhfdjetnxcvnYsA3Q4zejX64FVy4qpMd+UtG+VqAbE9vnA+TQjBV3TxcUIAFdK2hpwWR26DzDqq4JvBE6wvX3tQCq4qmzW+RPgeEk3AX+pGlHLbD9PTRbyVNt/rR3PgF0o6RXANEnrAnsDZ1SOaYIkYVOQtBVwoe3byvHyNHsq/a5uZIteWS20Rzm8QdKuwPfK8S40v7xHXvkl/WpgbXr+f9jeu1JIg/Dz8rwPAs6mLEaoGtFgvBH4HLA6cDXNhq1vqRpRy2zfL+kBSSt0odaxl+0Xlk8PkHQyTY3vsRVDGgjblvQLYMPasQzYXsB7aVb4fxc4jmbbqaGSmrApSDoH2MzlRVLT4mSO7c3qRtausnrqYJo9skzz7mHvLryTknQGzV5w59MzdG37W9WCGqAuLUboKkk/BTYFjgduHzs/4m80+r2png48YRTfVI8n6VvAF2yfVTuWQZH0EttHL+hcbUnCpiDpXNubjDt33qgXsHaZpLNHPckeI+lptk+S1LcweVQXI0g6mCk2o+1AMvKaPqdt+/CBBzNAXX1TDSDpEuBxNNOvt/NgffPI/i3r97t8GH+/ZzpyapdL2hv4cjl+M3B5xXhaJemdtj8x2R+pUf/jVHxb0u40Oyz3blQ7iquIngqcBDy/z7VRXowwp3YAla1o+3O9J0pbm1En94w62H5AUlf+Bv537QAGRdIONAusVpf0+Z5L04Gh2/swI2FTKCuJPk+zzNXAicC+tq+vGlhLJD3f9s8meafciSk5SW8BPgzczIOJqG2P5CqiMhqws+2jascSgzHJCME5Y8v4R5WkHwGnMP+b6u1tv6BWTINW/qb17gU4ciUmZb+/TYADgff3XLoNONn2TTXimkySsIgeZauKLWzfUDuWQZE0x/as2nEMmqQZwLuADZj/D9NIbt5Z+ui9gmbDzt/0XFqeptnx06sENiBde1PdS9KOwKeA1Wi6JawFXGx7JBvWS5pG06T9FbVjWZCuDMX+SyQtQ7Nlw/idxEe6fY+k44GX2L65HK8EfN92F4a0LwM608KmOEHS/sCRzF+oPYpTsL2+Q/Ocn0uzUvI1wN+rRtSuM2j6RK5C8wd5zG3AeVUiGqCSbL28dhyVfIimQ8AJtjeVtD3N/o8jqawCXlPS0rbvqR3PVJKETe3bwCU08+kH0rQuGvV9hABmjCVgALZvKu8iu+B2msbGJzN/Tdgo18O9rHzs3Z5h1DdyBHik7UMl7WP718CvJY3s6jHbf6EpzH5K7VgGKbWuQLNx6Y2SlpC0hO2TJX22dlAtuwI4XdJs5n9z+el6IU2UJGxqj7P9Ekk72f6WpO8y/zD+qLpf0syxeoGyZUVX5q1/Um6dYXud2jFUcm/5eG3pnXkN0Le9yygpWzUcDDwBWBqYBtw+ip1AirE3zl1ekHGzpOWAU4HvSLqensRkRP2p3JagmXIfSqkJm4Kk39veQtKpNEWc19H01BvpEQJJzwa+BvyaZinzfwJ72D6uamADImlpYL1yeKnte6e6/yiQ9CQm1kaN+pYFz6N5U7UmTVIyHTjA9s+qBtYySXNopuWOBmbRbE68nu33VA0sWiPpEcBdNL/PX0mzUe13bHdiE+5hliRsCpLeAPwQ2Iimd+JywPttf6VqYAMgaRWaGgJoG
t52olBd0nbAt4A/0/zCWhN4je1T60XVLkkfALajScKOAXYATrO9c8242iZpG9unL+jcqBlbiNG752FHVkf+jIkj+rfQjJB91fZdg48q2lIW3ryTiTXdQ7XwJklY9FWK8ddl/h/ekU1ExkiaC7zC9qXleD3ge7afXDey9kg6H9gYOMf2xpIeBRxheyQbto9ZXDZzXNTKyP4zaFpTXUdTrP9a2xtXDaxlkj4HzODBdmwvA26lScym235VrdjaJuk2HkxAlwaWYrSnoJH0K5qFN/vTs/DG9ruqBjZOasKm0NE+gmMjgPsAawDn0oyI/ZZmafeoW2osAQOw/cfS3HmU3Vk2rryvtHK5nmYEcCRJegqwNTBD0n49l6bT1EeNulfRPM+3Am+j+V6/uGpEg7G17c17jn8m6Szbm0u6sFpUA2B7Xk2UJAE78eBMx6haLBbeJAmb2jH06SPYAfsAm9NMQ24vaX3gI5VjGpQ5kr4OHFGOX8noF/TOKW84DgHmAv+kSbpH1dI0pQVLMn/B7q3ASE/BwrxVkgB3Ah+sGcuALTduwdFMmp8DgKHexmBRKl0DflLKEN5dO54WLRYLbzIdOYUuTE300/Pu8FxgS9t3S7pwVDf261UaWL+FZkNLaAq3v2T77sm/anRIWptmambk942StFZPQjLyJB1l+6Vl+rnfVg0j20cQQNJzgK/QrJgTsA7NgqtTgN1tf7ZacC0b1x92CZoFGU+1PbLblUyy8OaDtmdXDWycJGFTkPQ2mlGBLvQRnEfSj4HdgH1ppiBvopmme07NuKI9klan2UW7d9p9pGsAS73f/kwsNxjJaXdJj7Z9bdlyZoIuJKTlTdb65fDSrhTjSzqs5/A+moVHh3ShW8CwSxI2ha71EexH0lNpljMfO+w7Dy8KkrYBDmBiQjKy33NJH6cpUr4IuL+ctu0d60XVPkl/oBkZmcuDzxvbc6sFNQBlu4KxOsD1aJKSX476ViyltvNNwH+VU6fQrIoc6ecN3V0JvDhIEjaFjvYRnAZcaHv9Bd55BEm6hKZYefwf5pHdT0fSpcBGXZlyHSNp7iivep1MWQH8n8BKwOnAWcA9tl9ZNbAWlJ6Jp9i+tdR6LkWzBQ00CxTut/2GagEOSFdXAi8OUpg/tc71ESw9ty7tLWDtmFts/7J2EAN2Oc0fp04lYTSr494M/JgOlRvQvPm+Q9LraeodP1HqP0fRJcCXaRbYbD5uG46TymjoyMpK4OGXJGxqXewjCM075Asl/Z75e26N9PRUcbKkg4AfMf/3/Ox6IbXuDpqf8xPp1s/5a8rHd/Sc60LPTJU/zq8EXl/OjeQf5LLFzP7l8H5Jj7X9JwBJj6FntHtEdXYlcKn/ezETaz4PrBVTP0nCpvYTOtZHsPif2gFUtGX5OKvnnBntPdJml1undLhn5r7Ae4Af276wJCMn1w2pPbavLZ++g+ZN1uU0qyPXolmANLJ69sf6ZhcWXozzU5qOCHMZ4lH+1IRNotRGnWB7+9qxDJqkj4/fVbjfuYjFmaRlgf2Ambb3kLQu8HjbP68cWrSkjI48vhxe2pU6SEnHAy+xfXM5Xgn4vu3/rhpYiyRdYPtJteNYkIyETaLURj0gaQXbt9SOZ8CeCYxPuHboc27kSFoB+AAPrqD6NXDgKP4MdH3fKJp+sHNpamYArqZpaj2SSZikz9red5IeiiNbbjBuj6xej5OE7R8NNKA6VhlLwABs3yRp1YrxDMIZkja0fX7tQKaSJGxq/wTOL+8iemujRrJWRtKbaDYvfKyk3s06l6dZRdUF3wAuAF5ajl9F88d6sl/ki7N9ysfnVY2insfafpmkXQBKsbpqB9Wiw8vHT1aNYvCeP8U109R/jroHxnULWJs+ifiI2RZ4raQraKYjRbP1zlC9uUwSNrUf0Y3/oGO+C/wS+Cjzt7O4rQMrxsY81nZvH70PjurKsbJx5zTgm12cdgfukfRwyh8jSY9liGtHFoGDgKcDz+lSaYHtk
a77WkjvBU6T9GuaZOQ/gT3qhtS6HWoHsDCShE3B9rcWfK/RUabcbpH0PuC60q5oO2AjSYf3DmePsDslbWv7NJi3eeudlWNqTcen3T8AHAusKek7wDbAa6tG1K5HS9oa2FHS92n+GM8z4iuAO1VqMJ7tYyXNokm8zqFZcDayv9eg6QAhaVtgXduHSZrBg71Ch0YK86dQCnU/CmwALDN2fpR3TwcoIz+zaJb2HkOzyuSJXWhbJGljmmmbFcqpm4DXjHIvRUk/BTYFOjHt3kvSI4GtaBKSM0d5Y2ZJO9NsSbEtzQatvUmYR7Vd0xhJP6QpNejdrHVj26NYajAfSW+gKT9YAziX5mf+t6P8PS8NymfRLLZZT9JqwNG2t6kc2nwyEja1w2jeOX0G2J5mOfMSVSMajAds31cKWg+2fbCkc2oH1bYyNfcq2xtLmg5g+9bKYQ1Cp6bdJa1v+xJJY7uFj21hMLPUzYzkiJDtHwA/kPQ/tj9UO54KOlNq0Mc+wOY0bzS2l7Q+8JHKMbXthTRvLs8GsH2NpOWn/pLBSxI2tYfbPlGSyh4rB5SWH++vHVjL7i3Fyq/mwaLWpSrGMxBlam7b8nkXki+gmXYvtVEzbV9aO54B2I9mWuZTfa6N+p5wdDQBg46VGoxzl+27JCHpYeVNyOMX/GWLtXtsW9JYzecjagfUT5Kwqd0taQng/yS9lWYJ+9DNKbdgN+CNwIdtXyFpHeDblWMalHMkzabZqqB3am5kR4okPZ9mxdzSwDqSNqGplRnJLQts71E+dnExQpe9CfhWqQ0T8A9Guwaw11WSVqSpBTte0k3AqG/eepSkrwIrStodeB1wSOWYJkhNWB+Svm37VZLeCXwJWBH4EE2d0Cdsn1kzvmiPpMP6nLbt1w08mAEpo7tPo2l0vGk5t1hsdPjvkLQMzZYs29KMgP0G+Irtu6oGFq3qWKnBBJKeSvO37Fjb99SOp02Sngk8iybpPs728ZVDmiBJWB+SLgKeQbNdw3ZMXEU0kts1ZPPObpJ0pu2tJJ3Tk4SdN+rfb0lHAbcBR5RTrwBWtP2SelG1T9KngG/YvrB2LIMgaVfbR2j+Btbz2P70oGOKGJPpyP6+ApxI08h3LmWTt56Po7o6suubdyLp831O3wLMsf3TQcczIBdKegUwrawI3hs4o3JMg/Ak2xv0HJ9c3oCNuouBr0lakmbx0fdGfJuGsVqgoSvKjshI2BQkfdn2m2rHEYMj6WvA+jQ1YQAvBq4AHglcbnvfSqG1pvRQfC/NsD3AccCHRr2vnqQjgC+MlRdI2hJ4i+1X141sMEph9m7ALjQdMQ6xPbKNvCOGUZKwmKBsTfFxYFWa0b+xdg/TqwY2AJLOBLaxfX85XpKmVmhb4PxxIycjQdJLbB+9oHOjome6fSmaZs5/LZdmApeM4vd4vLIdy/NokrA1gaNofsZvt/3ymrG1RdJjgM/R7JFl4LfA22xfXjWw6LQkYTGBpMuA59u+uHYsgybpUmCLsemZspLq97Yf31szNUoknW17swWdGxWS1prqetmOZmRJ+gxNAnYScKjt3/dcu9T2SG5dUN5gfRH4Xjn1cmAv21vWiyrasrhstp6asOjnb11MwIpPAOdKOoVmBPC/gI+UPWZOqBnYoiZpB+A5wOrjauGmA/fViap9vUmWpJVoRoJ6fxeOdBIGnAe8z/btfa5tMehgBmhZ271b7Rwh6R3Voom2LRabrWckLCaQ9DngP2j2lJlXFzTKe2X1Ku0tXkVTwLwccJXtU+tGteiVFk2bAAcy/wbEtwEn276pRlyDIulDNPtE/YkHVwOPfPuerpG0cvn0XTRtyL5P8/1+GbCS7ffUii3aI2mu7SdLOt/2hr3nasfWK0lYTNDFvbLGdLTH2lI0I0Fd2TEfmDf1vOGo75XUdZKu4MHV7eN52KanYtGQdAZNneMPaKberwY+NmzT7UnCInqUou2xHmubjPVYG+Umv7075tse+R3zx5SGzm+yf
X3tWCJi0ZK0Oc1sxoo0m61PBw4ats3WUxMW80h6p+1PSDqY/pu17l0hrEHrYo+1A2hqgU4BsH1uaVU16j5K06bqAuafdh/p5HOMpFWZv2D5r1PcPWKxUVb/vsz2/sA/aerBhlKSsOg1Vow/p2oUdXWxx9q9tm+R5m8MUSuYAfoWzVYs5wMPVI5lYCTtSNO8fDXgemAtmv/7T6wZV8SiYvt+SdvWjmNhZDoyYhJd6bEm6VCaDhHvptmcdm9gKdtvrBpYyySdZXvz2nEMmqQ/0PQKPcH2ppK2B3a1/frKoUUsMpK+DKxOs/H2vJXAw7bALElYTCBpFs0O6mvRM1o66r0Eu2qSHfP/d9QbWUv6NM005Gzmn448u1pQAyBpju1ZJRnb1PYDkv5ge+PasbVJ0jbAubZvl7QrsBnwuVHfF66rFpcFZknCYoKyauwdjJumyS+r0SRps1FPPPqR1K9Fz8hvUSHpBOAFNDVxq9BMSW5ue+uacbVN0nnAxsBGwDeBrwMvtf3UmnFFtyUJiwkknWZ7sZhPj39fSUb+g2Yp95G2L6gcUixikuTyy75sPHwXzZYNr6SZcv+O7Rsrhti6sS4Qkt4PXG370FHuDNF1ZSSs3wKzjITFcJP0dJqmvifSwc1au0jSfwAvpdnAcjpNMva/daNqn6Tn0hSk964SPLBeRO2QtA9wre2jasdSi6RfA8fSrJT7L5oRwD+MbeQZo0XSi3sOlwFeCFwzbKv8k4TFBJKOANYHLuTB6cihm0uPRU/ShsA7aZZ3L107njZJ+gqwLE1Lk68DO9P0CR25AvXSiP5A4ALgq8w/QiCa/9/Ta8Q2KOWNxiuAs2z/RtJMYDvbh1cOLQZA0hLAacM27Z4kLCYY5Sa+MZGkJ9CMgL0YuBE4EvjhqG9iKuk82xv1fFwO+KXt/6wdW1skLTPqCy4i+in7Pf7C9uNqx9Ir+4RFP2dI2sD2RbUDiYH4Bk0/vf+2fU3tYAbozvLxjtIv9Ebg0RXjaV3ZiHjlPpdus33vwAMaIElbAQcDTwCWBqYB/7S9QtXAohWSbmP+Ed/raPqHDpUkYdHPVsC5pefa3Tw4XZEtKkaQ7afUjqGSn5eNeQ8Czqb5hX1I1YgG42xgTZpm1qJp63KdpL8Bu9ueWzG2Nn0BeDnNvlGzgFcD61WNKFpje/naMSyMTEfGBJLW6nc+W1TEqJL0MGAZ27fUjqVtkg4BfmD7uHL8LJqp6MNo9s3asmZ8benZH+28sTeUks6xvWnt2GLRk3Si7acv6FxtGQmLeXqmKW6rGkjEgNm+m56VwCNuK9u7jx3Y/pWkT9resySjo+oOSUvTjPJ/ArgWWKJyTLGISVqGZsHNKpJWohnthWbV9+rVAptEkrDoNZdmSkbATOafrvgr0IWmzp1WVhAtZ/vW2rFEa66V9C6aOkBoFmX8rTQ9HuUemq+iqQN7K/A2minZF0/5FbE42hPYl6Y36lweTMJupZmSHiqZjowJynTFj20fU453AF5ge8+6kUUbJH0XeCNwP3AWzTvGz9k+qGpg0QpJqwAfAMY2ZD4d+CBwCzDT9mW1YotYVCTtZfvg2nEsSJKwmEDS+eM3MOx3LkaDpHNtbyLplTT99N4NzB31hRhd7yUoaXmaBTf/rB1LmyQdZfulks6n/w7qI/1z3mWSngRswPybMQ/VvnCZjox+rpH0PuCIcvxKoEtbF3TNUpKWoukn+AXb90rqwruzLwMbS9oYeDvNhq2HAyPdS7BsyHs4sHI5vgF4zQi3q9qnfHxe1ShioCR9ANiOJgk7BtgBOI3mZ39opCgx+tkFmAH8uNxWLediNH0V+DPwCODUsjq2CzVh95V+ijvRJJ9fBBaLZe3/pq8C+9ley/ZaNAno1yrH1Brb15ZPlwD+ZvsvZbTzeh6sF4rRszPwdOA627vRNG8fuj3hMh0ZERNIWtL2fbXjaFNXewlK+oPtjRd0btRImgNsbfuecrw0cLrtzetGFm2Q9HvbW
0iaS9Oa7DbgYtvrVw5tPpmOjAkkzaDpHzi+sfHTqgUVrerXyJqm1+AoexlNL8HX276u9BLswmKEyyX9D/DtcrwrcHnFeAZlybEEDMD2PSURi9E0p2zGfAjNKsl/Ar+tGlEfGQmLCST9iqZ/4P40q+ZeA/zd9tC1fIh/X5caWQeUvZM+yIOrI38DHGD7pnpRtU/S8cDBtmeX452AvYdt885Y9CStDUy3fV7tWMZLEhYTSJpr+8njdpY+K8P2o6mLjawhvQS7RtJjge/Q7B8l4Erg1dmSY7RIWt/2JZI263fd9tmDjmkqmY6MfsYa+V5bpqmuoaykipHUuUbWRad6CUr6GX22aBhje8cBhjNwtv8EbFXeZDDqW3N02H7AHsCn+lwzMFRlNUnCop//lbQCzaqpg2k273xb3ZCiRf0aWX+9akQDYvsySdNs3w8cJukc4D2142rJJ2sHUFNpyfRiYG1gSalZGGl71GsfO8X2HuXj9rVjWRiZjoyIeTrWyPpU4Bk0Ced1NL0EXzvqqwRh3srAsVG/S23fO9X9R4GkY2m6Asyl6Q4BgO1+IyaxmJP0FuA7tm8uxysBu9j+UtXAxkkSFtFRkp5m+yRJL+p33faPBh3TIJX90K4HlqIZ6V0B+NKo1whJ2g74Fs3ecKLpofga26fWi6p9ki6w/aTaccRgjHUCGXfuHNubVgqpr0xHRnTXU4GTgOf3uWZgpJOwnvZEd9KsFuyKTwHPsn0pgKT1gO8BT64aVfvOkLSh7fNrBxIDMU2SyobMlAb1Q7clSUbCIqJTut5LsHfV81TnRo2ki4DHAVcAd9OMAnrUn3dXSToIWIumQwTAnsCVtt9eL6qJkoTFBOMLWMfOp4B1NEn6CPCJcbUTb7f9vqqBtUTSo21fW6YjJxj1Bt6SvgE8wPy9YafZfl29qNrX1e93V0lagibxGtsH7njg62URztBIEhYTpIC1W/rVSUg623bffXZGhaR1gGtt31WOHw48yvafqwbWsvIm6y3Mv1nrl2zfXS+qwZC0LbCu7cNKZ5DlbF9RO67oriRhMUEKWLtF0nnA5mN/hEsyMsf2E+tG1q70EuwWSR+g2Q/u8bbXK3viHW17m8qhRQskbQMcQDMluSQPTj8/pmZc46UwP/pJAWu3fAc4UdJh5Xg3mtVzo65TvQS7XgsHvBDYlGYvPGxfI2n5uiFFiw6lWfU834zOsEkSFv1sC7xWUgpYO8D2x8to2FjtxIdsH1czpgH5u6Qdx/USvKFyTG3ap3x8XtUo6rnHtiWNrZZ7RO2AolW32P5l7SAWJNORMUEKWKMLutpLsCQfd9p+oGxPsT5Nr9CR3rBV0v7AusAzgY8CrwO+a/vgqoFFKyR9jKYf7I9oBhOA4esdmSQs+koBa3eUzVo/DqxKk4yMjXxOrxrYgHStl6CkucB/AisBpwNn0YwSvbJqYAMg6ZnAs2h+xo+zfXzlkKIlkk7uc9q2h6p3ZJKwmCAFrN0i6TLg+bYvrh3LIHV1K5axla+S9gIebvsT/XYXj4j2LVE7gBhKLwR2BG6HpoAVSAHr6Ppb1xKw4qfATsB9ND/rY7dRJ0lPodkf7Bfl3LSK8bRK0mnl422Sbu253Sbp1trxRTskPUrSoZJ+WY43kPT62nGNl8L86CcFrN0yR9KRwE+Yv3ZipNsWAWvYfnbtICrYF3gP8GPbF0p6DNBv6mYk2N62fMwbyW75JnAY8N5y/EfgSJpVk0MjI2HRz1GSvgqsKGl34ATgkMoxRXumA3fQ1Mo8v9y6sILuDEkb1g5i0Gz/2vaOwMHl+HLbe1cOq3WSturdkkLS8pK2rBlTtGoV20fRdIfA9n0M4VYVqQmLvlLAGqOuq70Ey1TkoTSLbWZK2hjY0/abK4fWKknnAJv1NHRegmZT4pHuDNFVkk6hqfk8vtRAbgV83PZT60Y2v0xHRl8l6Uri1QFlm4Iv07TseZKkjYAdbf9v5dDatkPtACr5LPDfwGwA23+Q9
F9VIxoMuWfUoWzRkb+Bo2s/mp/xx0o6HZgB7Fw3pIkyHRkRh9DUCN0LYPs84OVVIxqAsu/dmsDTyud30JHfibavHHdq6KZpWnC5pL0lLVVu+wCX1w4q2lH2A3sqsDVNI+8nlt9tQ6UTv3AiYkrL2v79uHP3VYlkgMpWLO+iSUABlgKOqBfRwFwpaWvAJRnZH+jC6tg30vxBvhq4CtgS2KNqRNEaSW+hmXK/0PYFwHKShm7KPUlYRNxQdo8fq5XZGbi2bkgD0dWtWN4IvAVYnSYh2aQcjzTb19t+ue1VbT/K9itsX187rmjN7rZvHjuwfROwe71w+st8eEwgaV2ath4bAMuMnR+27vOxyLwF+BqwvqSraQrVd60b0kB0cisW2zfQ7BEWMcqmSZpXByhpGrB05ZgmSBIW/RwGfAD4DLA9sBsZNR1Zti8HnlGSkCVs31Y7pgEZvxXL6+jAViylDdnuTOwU8LpaMUW04FjgyPJ/HJq6sGMrxtNXtqiICSTNtf1kSefb3rD3XO3YYtGRtKvtIyTt1++67U8POqZB6+JWLJLOAH4DzKWnIN/2D6sFFbGIlS1I9gSeXk4dD3zd9lAtQslIWPRzd/kB/j9Jb6WpG1muckyx6I1Nv3WhDqqvjm7Fsqztd9UOYtC62iu0q2w/QLP1zpdrxzKVjITFBJI2p1kttSLwIZod1Q+yfWbNuCIWBUmn2d5W0m2UxQhjl2g2a51eKbSBkPS/wBm2j6kdyyBJOha4hYkjgJ+qFlQscpKOsv1SSecz//9vAIZtM+YkYTGfUrz4cdv7144lBkPSt4B9xlYSSVoJ+FRqhEZTST4fQdMl4F66k3xeYPtJteOIdkl6tO1rJa3V73rZE3BoZDoy5mP7fknb1o4jBmqj8Uu5JW1aMZ6BKG1MLhxbiFD6Cm5g+3d1I2tXhxtZnyFpQ9vn1w4k2mP72vJxqJKtySQJi37OkTQbOJqyhxKA7R/VCylatISklco+OkhamW78bvgy0Ns38PY+50aGpPVtXyKp7/MrO4yPsm2B10rqVK/QrulTZjDvEkM44tuFX7Tx0C0D3Ag8reecgSRho+lTwG8lHV2OXwJ8uGI8g9K1XoL70ewQ368Gysz//30UdbVXaKcsbiO9qQmLCCRtwIN/hE+yfVHNeAZB0o+AU3hw9dSbge1tv6BWTIMgaYmycqz33DK276oV06CUUot1bR9W9ktbzvYVteOK7koSFhNIOoz+q0pSqB0jQ9KqwOdpkk8DJwL7jnorG0nf6P2/XDbpnW376VN82WKv9AqdBTze9nqSVgOOtr1N5dCiw0Z56D3+dT/v+XwZmh5711SKJaIVJdl6ee04Krha0pdsv7mshP0FHegUQPN7bFPgbGh6hZbFGBHVZCQsFqhs3Hqa7a1rxxIR/z5Jn6DZ/+/JwMe6sFu+pN/b3kLS2bY3KyOAv01hftSUfoCxMNYFVq0dRET86yS9aOwG/A7YCjgHcDk36sb3Cj2BbowAxhDLSFhM0GeJ73XAe7rwbjliVJVaz8m4CzWfXewVGsMtSVhEdFJ6CUZEbZmOjAkknbgw5yIWcz8FdgLuo9modewWETEQWR0Z80haBlgWWKWsmlK5NB1YvVpgEe1Yw/azawcREd2VJCx67QnsC6wGzOXBJOxW4AuVYopoS3oJRkRVqQmLCSTtZfvg2nFEtEnSRcDjgE71EuxqLZykdYGPAhvQ7H8IgO3HVAsqOi8jYTGB7YMlPYmJv6wOrxdVxCLX1V6CPwVuoRntvrtyLIN0GPAB4DPA9sBupC46KstIWExQ2ntsR5OEHUPzx+o02zvXjCtiUetiL0FJF9h+Uu04Bk3SXNtPlnS+7Q17z9WOLbor7wKin52BpwPX2d4N2BhYoW5IEYtWebPxLuA95dRSwBH1IhqYMyRtWDuICu4u3T/+T9JbJb0QWK52UNFtScKinzttPwDcJ2k6cD2wZuWYIha1FwI7UralsH0N0IVegtsCcyVdK
uk8SedLOq92UAOwD83q771p2jXtCrymakTReakJi37mSFqRpqXHXOCfwG+rRhSx6N1j25IMUHoJdkHnauEkTQNeZnt/mt9nu1UOKQJITVgsgKS1gem2u/BOOTpE0v40fVGfSbNq7nXAd7uwMrijtXBn2t6qdhwRvZKExTyS1rd9iaTN+l23ffagY4poUxd7CZZauFnA422vJ2k14Gjb21QOrVWSvkyz6fTR9HRGsP2jakFF5yUJi3kkfc32HpJO7nPZtp828KAiYpGSdC6wKXC27U3LufM6sD9avwbmnWhcHsMrNWExj+09ysfta8cSEa3pZC1cWekdMVSShMUEkt4CfMf2zeV4JWAX21+qGlhELApHSfoqsKKk3Wlq4Q6pHFPrykjYhKmfjIRFTZmOjAkknWt7k3HnzhmbuoiIxVtHa+Fe3HO4DM0WJdfY3rtSSBFJwmIiSecDG7n8cJTl3efZfmLdyCIWnfQS7LaycetptreuHUt0VzZrjX6OBY6U9HRJTwe+V85FjJLDgC8D99H0EjycbuyYH411gVVrBxHdlpGwmKC8Q9yTpnURwPHA123fXy+qiEUrvQS7RdJtzF8Tdh3wHts/rBRSRArzY6LSsujL5RYxqubrJQhcTXoJjizbXWhJFYuZTEfGBJK2kXS8pD9KulzSFZIurx1XxCLWyV6CktaV9ANJF5X/35d34f+3pBMX5lzEIGUkLPo5FHgbTd/ITEHGyOl4L8HDgA8An6GphduNEX5DLmkZmmR7lbLdjsql6TQ76EdUkyQs+rnF9i9rBxHRFtv3l/6JXfRw2ydKku2/AAdImgu8v3ZgLdkT2BdYjeaN5VgSdivwhUoxRQApzI8+JH0MmAb8CLh77Hx6R8Yo6WovQUlnANsCPwBOoqmF+5jtx1cNrGWS9upCc/ZYvCQJiwnSOzK6oKu9BCVtDlwMrAh8iGZa7iDbZ9aMaxAkPYmJ+8IdXi+i6LokYRERHVFq4T5eauE6RdIHgO1okrBjgB1oNmvduWZc0W2pCYsJJD0K+Aiwmu0dJG0APMX2oZVDi1hkuthLsOO1cDsDGwPn2N6t/J7L5rxRVZKw6OebNCuo3luO/wgcSbNqMmJU/Lzn83m9BCvFMkjnSJpNx2rhgDttPyDpPknTgeuBNWsHFd2WJCz6WcX2UZLeA2D7PknZqiJGyvid0iV9DzitUjiDtAxwI9Bb42mahTijbI6kFYFDaFZJ/hP4bdWIovOShEU/t0t6JGWqRtJWwC11Q4poXSd6Cdru0p5o89h+c/n0K5KOBabbPq9mTBFJwqKf/YDZwGMlnQ7MoKmniBgZk/QSfFelcAama7Vwkta3fYmkzfpc2yxb70RNWR0ZfUlaEng8zcaGl9q+t3JIEbEISHpxz+G8Wjjbe1cKqVWSvmZ7j2y9E8MoSVhMIOktwHds31yOVwJ2sf2lqoFFLEKSTrT99AWdG3WliflptreuHUtE14xsv7D4t+w+loAB2L4J2L1eOBGLjqRlJK1M6SUoaeVyW5tu9hLsRC2cpLeUwvyx45UkvXmKL4loXWrCop9ppa/cWGH+NGDpyjFFLCqd7iXY1Vo4mjeXXxw7sH2TpN2BjPBHNZmOjAkkHQSsBXy1nNoTuNL22+tFFbFopZdgt0g6H9ho3JvL82w/sW5k0WVJwmKCUiOyJzBWG3M88HXb2SssRkoXewl2tRYuby5jGCUJi4hO6lovQUnLAMsCJ9M877Fp2OnAsbbXrxTaQOTNZQyjJGExj6SjbL+0DNv320doowphRbSi/JyP9RLceKyXoO1nVg6tFZL24cFauKuZvxbuENsjXw8XMWyShMU8kh5t+1pJa/W7bvsvg44poi2Sfm97C0lzge2B24CLOzAi1MlaOEnbAAfQTEkuSZOE2vZjasYV3ZbVkTGP7WvLxyRb0QWd7CVo++Au1sIBhwJvo/leZwoyhkJGwmKePkvX512iecc4fcAhRQxE2SOsE70Eu1YLN0bS7
2xvWTuOiF5JwiKiU6bqJQgw6r0Eu1YLN0bSx4BpwI+Au8fOj/r3O4ZbpiMjomv2A/YAPtXnmoFR7yV4p+0HJN0naTpwPbBm7aAGYGwUbFbPuS58v2OIJQmLiE6xvUf5uH3tWCrpai1cV7/fMcQyHRkRnZRG9Z2rhXsU8BFgNds7SNoAeIrtQyuHFh2WJCwiOknSubY3GXfuHNubVgqpVamF0y+Bw4D3llq4JWnq4jasHFp0WKYjI6Krutaovuu1cKvYPkrSewBs3ycpW1VEVUnCIqKrjgWOlNTbS/DYivG0KrVw3C7pkZRteCRtBdxSN6ToukxHRkQndbWXYFdr4co07MHAk4ALgBnAzl2oh4vhlSQsIqJDulYL16vUgT2eZgPqS23fWzmk6LglagcQEVGDpG0kHS/pj5Iul3SFpMtrxzUA0ySNNe/uQi0cMG8EcDnbF9q+AFhO0ptrxxXdlpGwiOgkSZfQp5eg7RurBTUAkg6iaWLdWwt3pe2314uqfV0eAYzhlcL8iOiqW2z/snYQFbyLJvF6Uzk+Hvh6vXAGpmurYWMxkJGwiOik9BLslq6OAMZwSxIWEZ0k6eQ+p217pPfLkrQNcABNQrIkTZG6bT+mZlxt6+pq2BhuScIiIjqkq7VwEcMoNWER0Ukd7iXYqVo4SUfZfqmk8ykbtfayvVGFsCKAjIRFREd1tZdg12rhJD3a9rWS1up33fZfBh1TxJgkYRHRSZLOsr157zYF/bYxGDVdrYWLGEaZjoyIrupkL8Gu9Y6UdBt9piF5cEHC9AGHFDFPRsIiopO62kuww7VwEUMnSVhEdFYXewl2tRYuYhild2REdFKHewmuYvso4AEA2/fRs1VFRAxOkrCI6Krdbd88dmD7JmD3euEMTCdr4SKGUQrzI6KrutpLcD9gNvBYSadTauHqhhTRTakJi4hO6nIvwS7WwkUMoyRhEdFJXe0lWGrhvjM2FStpJWAX21+qGlhEByUJi4jokH4b0vZuWBsRg5OasIjolPQS7GwtXMTQSRIWEV2zT/n4vKpR1HMscKSk3lq4YyvGE9FZmY6MiOiQrtbCRQyjJGER0SnpJRgRwyJJWEREB6QWLmL4JAmLiOgASY+2fa2ktfpdt/2XQccU0XVJwiIiIiIqyOrIiIgOSC1cxPDJSFhEREREBUvUDiAiIiKii5KERURERFSQJCwiIiKigiRhERERERUkCYuIzpP0b60U/3e/PiK6KUlYRIwUSa+WdJ6kP0j6tqTnS/qdpHMknSDpUeV+B5TrpwPfljRD0g8lnVVu25T7PULSNyT9vjzGTuX8ayXNlnQScGK9ZxwRi6u8e4uIkSHpicD7gK1t3yBpZZq9sbaybUlvAN4JvL18yQbAtrbvlPRd4DO2T5M0EzgOeALwXuAk26+TtCLwe0knlK/fDNjI9j8G9iQjYmQkCYuIUfI04GjbNwDY/oekDYEjJT0aWBq4ouf+s23fWT5/BrCBpLFr0yUtBzwL2FHS/uX8MsDM8vnxScAi4l+VJCwiRt3BwKdtz5a0HXBAz7Xbez5fgmbE7K7eL1aTlb3Y9qXjzm857usjIh6S1IRFxCg5CXiJpEcClOnIFYCry/XXTPG1vwL2GjuQtEn59Dhgr5KMIWnTRRxzRHRUkrCIGBm2LwQ+DPxa0h+AT9OMfB0taS5wwxRfvjcwqxT1XwS8sZz/ELAUcJ6kC8txRMS/Lb0jIyIiIirISFhEREREBUnCIiIiIipIEhYRERFRQZKwiIiIiAqShEVERERUkCQsIiIiooIkYREREREVJAmLiIiIqOD/AwPpZaidvbnCAAAAAElFTkSuQmCC", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAOwAAAD3CAYAAAAewrhMAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8rg+JYAAAACXBIWXMAAAsTAAALEwEAmpwYAAAgjklEQVR4nO2deZwUxdnHv8+ynAOCCIggCIpHxAOvwSgaJBija+KdN16jxitEfeOboETjGnSNJh6JxijGeE5MPIMnMQYIGuVwPACNKCoiATlEkD167916/6jaddjsze5W98zz/Xzmsz1b3VW/7q5fV3VNdz1ijEFRlGiQ41uAoiitRw2rKBFCDasoEUINqygRQg2rKBFCDasoESKUhhWR90RkYju3HSkiJSLSrWNVgYgYERnT0fl2JiIyXUQe8a0jjIjIRBFZ04XlfSoik7cljxYN2xGFtBVjzFhjzMutWbehPmPMf4wxfY0xNZ0mUFE8EaoWVkRyfWtQLGIJVf0IE53Rg2sNbTohInKuiLwmIreKyJcislJEjm2Q/omIFLu0M9PSLhSR913aMhE50P3/UxGZJiLvAIGI5Ka3mq5L95SIPO62fVtE9ndpfwJGAs+7bvCVIjLKdV1z3TrDROQ5EdksIh+LyIVpmqaLyBMiknR5vyciB7dwGI5z+/iFiNwiIjki0sPlv29a3kNEpFREBjdyHLuJyG0uj5UicmkDzf1F5H4RWScin4nIDXUVpBXnYLSIvOL2ZzYwqEHZh4rIAhHZIiJL0289RORlEfmliMwHSoFdWzgWiMiTIrJeRApF5F8iMjYtbQcReV5EikTkDbcfr7m0rc5TWvkXuOXdROSfIrLJHac/i8iAZnSMFZHZ7jxsEJGr3f97isjtIrLWfW4XkZ5N5PE1p2GLqwvfTUt7SERmiMjfRCQAjhKRPBFZ7PZvtYhMb5Df2SKyyu3DzxukxUVkoStrnYj8XkR6tHS8McY0+wE+BSa75XOBKuBCoBswBVgLCBADioA93bo7AWPd8mnAZ8Ahbt0xwC5p+S8BRgC9GylzuivzVKA7MBVYCXRvuK77PgowQK77/i/gbqAXMA7YCExKy7scOM7tz03AomaOhQHmAQOxF4oPgQtc2t3Ar9PW/THwfBP5/BBYBuwMbA/MaaD5aeAP7pgOAVLAxS2dA5e+EPgN0BM4EigGHnFpw4FNbn9zgKPd98Eu/WXgP8BYINcd7xeAnzVzTH4A9HPl3Q4sSUt7zH36AHsDq4HXGjtPaeXXHc8xTl9PYLA7j7c3oaEfsA74qTvP/YDxLu16YJE7joOBBUCBS5sIrHHL3YGPgauBHsAkd+zq6vNDQCFwuDt2vdz2+7rv+wEbgBPd+nsDJe4c9HTnpJqv6vVBwKHuOI8C3gcub9GP7TDsx2lpfdxBH4qtXFuAU3DGS1vvJeDHzeT/g2bKnE6aidzBWQcc0ZJhsReBGqBfWvpNwENpec9JS9sbKGvBsN9O+/4jYK5bHo+t7HXGeRP4XhP5/BNnQPd9cprmHYGK9GMInA7Ma8U5GOkqRSwt/S98ZdhpwJ8aOTfnpBnm+pbqRDPHZ4DT0h97ManCVXiXfgOtNGwjeZ8ILG4i7fRm0lYAx6V9Pwb4tBHDHgGsB3LS1n0UmJ5m2GQL+3878Fu3fC3wWFpaDKhMr6sNtr0ceLqlY9yee5T1dQvGmFK32NcYEwD/g2091onILBHZy6WPcAeuKVa3UGZ9ujGmFlgDDGuF1mHAZmNMcdr/VmFbmjrWpy2XAr2k+XvpdK2r6nQYY1532090+z0GeK4ZXen5pC/vgr3ar3PdpS3Y1nZIY5rTz4HL90t3LtI1pud9Wl2+Lu8J2N5QY1qaxXXtfyUiK0SkCHvxBNsNH4y9ADW1ny3lvaOIPO
ZuCYqAR2jQvU+jufo1jK2PQf05a2S91a5+pa+bXle20i8i40VknohsFJFCbN2v07jVOXbnZFPatnuIyAvudqIIuLGZ/aunQwcVjDEvGWOOxlaAD4A/uqTVwG7NbdpC1iPqFsQOhOyM7Qa2tO1aYKCI9Ev730hs97y9jEhbHpmmA+Bh4CzgbOApY0x5E3msw+5DY3muxrawg4wxA9xnO2PMWFpmHbC9iMQaaEzP+09p+Q4wxsSMMb9KW6ctr2+dAZyA7SH0x7aaYG97NmJb+6b2s+6i0iftf0PTlm90WvY1xmyHPa7ShI7VNH2/vRZ7oaqj4TlLX2+EbD3Q1rCuNDw2f8FelEcYY/oD96RpXMfW9bYPsEPatjOwHtnd7d/VNL1/9XSYYd0V8QRXWSqw/fe6q9V9wFQROUgsY0RklyYz+28OEpGTXct3uct/kUvbQBMnyxizGnvPcpOI9BKR/YDzsVfr9nKFiGwvIiOw96mPp6U9ApyErVzJZvJ4AvixiAx3AynT0jSvA/4B3CYi24kd1NpNRL7RkjBjzCpsV/w6sQNhE4DvNND3HRE5xrWOvcT+Frlzoxm2TD/sudiENd6NaVpqgJnAdBHp43odibT0jVgznOW0/ICtL+r9sHWoUESGA1c0o+MFYCcRudwNMvUTkfEu7VHgGhEZLCKDsF3Vxs5/XQ/pShHpLnYw7jvYe/Dm9n+zMaZcROLYC1gdTwHHi8gEN5h0PVv7rR92zKfEHZspzZRTT0e2sDnAT7BXqs3AN+pEGGOeBH6JvSIVA89gB25ay7PY7vaX2NbrZGNMlUu7CXtCtojI1Ea2PR175V+LHcz5hTFmTlt2rBEtb2EHymYB99cluAvE29gr8avN5PFHrCnfARYDf8O2RnW/HSewAx/LsPv8FFt3W5vjDOz99GbgF6RdOJy+E7BX843YlukKmqkHIvJi3YhrIySx3cbPnNZFDdIvxba864E/Yc1TkZZ+oSt/E3aga0Fa2nXAgdiBnllY8zeKu+U5Gmuw9cBHwFEu+QbsRewd4F3s+bmhkTwq3fbHAl9gBxETxpgPmioXO4ZxvYgUYy8ET6Tl9x5wCbbOr8Oex/SHNKZiz1Uxtj6kX/ibpG6AJLS4ofIxxpizfGtpDSLyALDWGHNNG7Y5FrjHGNOWXkfkEJFfA0ONMef41hJV9IfxDkRERgEnk9bqNrFebxE5TuxvzsOxLeHTXSCxSxGRvURkP3cbFMfejmTcfnYlatgOQkQKgH8DtxhjVra0OrbL9yW2S/w+tkuVafTDdmUDbJfvNuwthdJOQt8lVhTlK7SFVZQIoYZVlAihhlWUCKGGVZQIoYZVlAihhlWUCKGGVZQIoYZVlAihhlWUCKGGVZQIoYZVlAihhlWUCKGGVZQIoYZVlAihhlWUCKGGVZQIoYZVlAihhlWUCKGGVZQIoYZVlAihhlWUCKGGVZQIoYZVlAjRXFhFb4jI/2Lj8rxtjDmzpfXbkf90oMQYc2tH591ZJFNBDjYa2q5pn9Huf72wsXh6YENV9sBOVl6FjUla6ZYrgM+BTxp8Pk3EY01F2lNCRCgNiw0yNNkYs6bFNTOMZCrYGRuZe9cGn5FYM3YGJpkK1vGVgVe6v0uAdxPxmM42HxJCZ1gRuQdbQV8UkcewIQj3wVbW6caYZ0XkXGxE7hiwO3ArtlU5G9uKHGeM2SwiFwIXubSPgbPTAiDXlbcbcBc2AHEpcGELEcs6lGQq2A4baW0yNgLbnl1VdhqCDUA8DBvgOZ3Pk6lgLjAbmJ2Ix7LuIhomQhmqQ0Q+BQ7Ghq9cZox5xMVRTQEHAKcB17jlXlgzTjPG3CMivwVWGWNuF5EdjDGbXJ43ABuMMXemd4lFZC7wQ2PMRy6m6E3GmEmdtW/JVJCLbUGPxpo0TggvnM2wHJiDNfC8RDxW5FlPVhH2ivIt4LtpcV978VVE8XkuLmixC1f/vPv/u8B+bnkfZ9QBQF/gpfTMRaQvcBjwpEh98O
ueHb0TyVQwBBvf9lvYuLn9mt8i1OzpPpcA1clU8AbWvE8l4rF3vSrLAsJuWAFOMcYs3+qftiVMDwxcm/a9lq/26yHgRGPMUteNntgg/xxgizFmXIeqdiRTwRHY+/GTsd3yTCMX+Lr7XJtMBfOxgZCfSsRjlV6VZShh/1nnJeAycc2fiBzQxu37AetEpDvwX6PNxpgiYKWInObyFxHZf1sEJ1NB32QqmJJMBe8A/wK+T2aatTEOB/4MrE6mghuTqWBkSxsobSPsLWwBcDvwjojkYEcvj2/D9vnA68BG97exruiZwAwRuQY7sPUYsLStQpOpYCy2NT27iXKyiSHAVcC0ZCqYhW11X9LR5m0nlINOUSGZCrpju7s/Ao70LCfsrADuAR5IxGObfYuJKmrYdpBMBQKcAdwAjPKrJnIE2EjstyTisRLfYqKGGraNJFPBJOAW4EDfWiLOBmA6cF8iHqv2rCUyqGFbibtHvQU41reWDOMDYFoiHnvOt5AooIZtgWQq6IttCX5M+AfposyLwGWJeGyFbyFhRg3bDMlU8D3gN8Bw31qyhHLg18Cv9GWExlHDNkIyFeyKHdE82reWLGUFMCURj832LSRsqGEbkEwFJ2KfkOrvV0nWY4AbgWsT8VitbzFhQQ3rcA/l3wRMbWldpUuZC5yRiMc+9y0kDKhhgWQq2Al4HDjCtxalUdYC30vEY/N9C/FN2J8l7nSSqWAisBg1a5gZBrycTAU/9S3EN1nbwrqnlX6GfV65m2c5SuuZCZyXre/hZqVhk6lgAJAEvuNZitI+PgJOTcRj7/gW0tVkXZc4mQr2Bd5GzRpldgcWJVPBWb6FdDVZ1cImU8H+2FHHHXxrUToEA1yUiMfu8y2kq8iaFlbNmpEIcG8yFVzgW0hXkRWGVbNmNFll2ow3rJo1K8ga02a0YdWsWUVWmDZjDatmzUoy3rQZaVg1a1aT0abNuJ91kqlgH+Bl1KzZjgHOT8RjD/oW0pFklGGTqaA/8BY2Ho+iVAJHJuKx130L6SgyrUv8EGpW5St6AE8mU0HG9LYyxrDJVHAFNqKdoqQzAvizi68beTJiJ1wMmxt961BCyzHYKBCRJ/L3sMlUsCP2fdadfGtRQk0tcGwiHvuHbyHbQqQNm0wF3bCxSid6lqJEgy+AA6IclDrqXeIbULMqrWcQdhCqu28h7SWyhk2mgu8A03zrUCLHocCtvkW0l0h2iZOpYBdgCTayemgIirfwwC8v4bNPloEIF1wzg5ceu4v1qz4CoLSkkD59+1PwyEI+XLqQh2++nNzcHkwpeJChI8cQFG/hrqsTTL3jGXJyInstjQqnJeKxp3yLaCtRNewLQJ5vHQ2597qL2GPcYUw84VyqqyqpKC8l1m9Affqjd1xF79h2nHjBVfxu2umc9ZNb+WLdKt565XlO//FNPHrH1Yyb8G2+dpBGruwCPgf2TMRjW3wLaQuRu4wnU8EJhNCspSWFLF88n2989xwAcrv32MqsxhhSc2Zy6LdOA6BbbncqK0qpKC+jW253Nqz5hM2fr1Gzdh1DsGMgkSJShk2mgj7AHb51NMbGtavot/0g7iv4IflnH8b9v7yEirKgPn35kvlsN3AIQ0eOAeD4c6Zy7/SLeOHhW5l86sX8dcZ1nHLxtb7kZytTkqkgUmFDI2VY4BpgF98iGqO2pppVy5cw6eQLKPjTAnr26sMLD99Wn77oH0/Wt64Au+yxH9c+MI+rZrzI52tX0n/QUMBw188T3POL8ynctMHDXmQdOcCMKD0FFRmhyVSwBxDaiaS3HzKcgUOGs9s+hwBwyKQTWbV8KQA11dW8Ne85xk8+5b+2M8bw3AM3c8IPpvHMfTfxP5fewMQTzmX2EzO6VH8WEwfO9y2itUTGsNgwhD18i2iKATvsyMAhw1m36kMAlr35MsNG7wXAe2/MY6dRezBwx/+OWjn/b39h/8OOoW//gVSUlyI5OYjkUFFe1qX6s5wCFwc49EQiQHEyFU
wgAg/2nzX1Nu659nyqqysZMmw0F+TbVvL12U9t1R2uo6K8lFdfeIQr7rTBx799+mX85v9OpltuD6YUPNCl2rOcHYErgF/4FtISkfhZJ5kKFmJ/8FaUziIAdk/EY+t8C2mO0HeJk6ngVNSsSucTA67zLaIlQt3CutG7D7ChGRSls6kBxibiseW+hTRF2FvY41GzKl1HN+Ay3yKaI+yG/ZFvAUrWcXaYR4xDa9hkKtgN+JZvHUrWsR0Q2qh4oTUsMAU7x6yidDVTfAtoilAOOiVTQS/gM2Cgby1K1nJEIh57zbeIhoS1hf0+albFL6EcPwmrYUN5sJSs4pRkKhjiW0RDQmfYZCo4GDjEtw4l6+kBhC4+T+gMi7auSni4OGyv3oVKTDIVbI+9f1WUMDAS+/BOaAiVYYGTgd6+RShKGmf6FpBO2Ax7tG8BitKAb4apWxwaIclUIMA3fetQlAbsABzgW0QdoTEsMA47M7uihI3JvgXUESbDandYCSuhqZtqWEVpmcPd47LeCYVh3cGY4FuHojRBL+AI3yIgJIbFmjUUVzBFaYJQ3MeGxbDaHVbCTijqaFgMG4qrl6I0w7hkKvD+K4Z3w7qDEJrfuRSlCULxnIB3wwIHoTNLKNEg7ltAGAy7m28BitJKdvUtIAyG9X4QFKWVeK+ralhFaT2jfQtQwypK6+mXTAWDfQoIg2G9X7UUpQ14ra9eDZtMBTtgJ25WlKjgtUfou4XV7rASNdSwihIhstqwev+qRI3svYdFW1glemR1C7uz5/IVpa14rbO+DavvwCpRIzeZCrr5Kty3Ybt7Ll9R2oO3euvbsD08l68o7cFbvfVtWG1hlSiiLayiRAhv9TbXV8FK57Fd9eZVJ3z5cG8wen47gUrpZeAKL2X7PqFVnsvPSCYXztwgGO+zI2QqPU15ta+yfXeJ1bAdzMiKD9/uW1ukZu1cvNVb34at9Fx+RiGmtmZC0d/7+daRBXirt74Nqy1sB3Jg8Or8XKp3960jC8jaFrbCc/kZQ8/asi/3LntrX986soBa8vKz9h52vefyM4aJRc+9K7C9bx1ZgNc669uwn3guPyPYvurzFUOqPjvMt44swWudVcNmAJMLZ24R/z/RZQtqWKX9jCl7N9XblB7kW0cWoYZV2keOqakcXzJ3R986sozsNWwiHlsPlPnUEGXGl8xd2I3aXXzryDJW+izcdwsLng9AVOldU7JxTPm/D/StIwvJ3hbWod3idjCp6JnlAvpUU9dSBqzzKUANG0GGVK15f2D15/ozTtfzKXn5xqeAMBhWu8Rt5KjCZ6skHOcu2/BeV8Nw0rWFbQN7l765oKep2M+3jizFe10Ng2EX+xYQFbqZqtIDg1dH+daRxXivq94Nm4jHVgPLfeuIAocXv/RGDmaYbx1ZzGzfArwb1jHHt4CwE6spXLtLxYf6Yro/PiQvf7VvEWExrPcrV9iZXDhzlUBv3zqymFDU0bAYdh7g7R3DsDOsYuU7/Wu+/LpvHVlOKHqBoTBsIh4rAt7wrSOUGFP7jaIXdP5mv9RgGxXvhMKwjlB0OcLG/qULF3Sn6mu+dWQ5b5CXX+hbBKhhQ0332oqi/Upf39O3DiU8dTNMhl0EFPsWESaOLHphsWAG+9ahhOP+FUJk2EQ8Vg284ltHWOhfvenTYVWrdKDJPyXAQt8i6giNYR2h6Xr4ZnLhzM9FYw+FgVfIyw/NdLxhM+xM7IhcVjOq/IO3YrXF+pBEOHjSt4B0QmXYRDy2Bnjetw6fiKmtPqz4pQG+dSgAbAIe9y0inVAZ1nG3bwE+OTh4ZUEuNbv51qEA8CB5+eW+RaQTRsPOAT70LcIHPWtLN+9VtlhfnQsHBpjhW0RDQmfYRDxmgHt86/DBUYXP/VtggG8dCgAvkZfv/f3XhoTOsI4HgVLfIrqSgVUbPhpcvfZw3zqUekJ5axZKwybisS3AY751dCWTC2eWCHTzrUMBYBUwy7eIxgilYR13+RbQVexetv
T1XqbsAN86lHr+QF5+rW8RjRFawybisbeBlG8dnU2Oqa4YXzJvJ986lHoqgft8i2iK0BrWEcr7iI7k0OI5C3OoHelbh1LPU+Tlb/QtoinCbtjHgc99i+gs+tQUb9itYtnBvnUoW3GnbwHNEWrDJuKxcuB63zo6i0mFT38s0Ne3DqWeZ8nLX+RbRHOE2rCOP5CBD1LsWLl62fY1X+js/eGhGpjmW0RLhD4IcCIeq06mgquAv/rW0mEYY44qerZWQHxLaYryyiqOnPYAFVXVVNfWcurhY7nuzEmcf8czvPnRZxhgj2E78ND/nUTf3j258/lF/OHFNxk5uD/PXHM6Pbrn8tp7q/jrgmX89sJjfe9Oa7ifvPzQT7crxngNFdJqkqlgPpARLdLY0jfmHxS8GuqHJIwxBOWV9O3dk6rqGiZceR93XHQce48czHZ9egHwkz++yJABMX522pEc+tN7WXDLBdz4xL/Yf/RQjo/vybevTfLolacxsF8fz3vTIiXAGPLyN/gW0hJR6BLXMRX7fGekyTWVwQHBa7v61tESIkLf3j0BqKquoaqmFhHqzWqMoayyGhGp/15VU0tpRRXdc7vxyLylHHvw7lEwK8DNUTArRMiwiXhsIfCwbx3byoSiv7+Zg4nE7641NbWMu+xuhpx1M0eP243xe44A4Lzbn2bo2TfzwZqNXHb8eAAuPX48h/70Xv6zsZDDvzaSB+cs5pK88T7lt5YVwC2+RbSWyHSJAZKpYDA2rMf2vrW0h741W9actPmBQQK9fGtpC1tKyjjpl49y58V57DNqR8Ca+bI/zOKQ3Ydz3tFbx5W+/tF57DdqKDk5QnLuEkYM7s9t5x9DTk4o24djycv/u28RrSWUR7ApEvHYRuBq3zray+QtM9dEzawAA/r25qj9RvP3tz+q/1+3bjl8/8h9+euCZVutu3ZTEakPP+PEr3+N256ez+PTvseAWC/mLg3diy8AM6NkVoiYYR33Am/6FtFWhld8snS72i2H+tbRWjYWBmwpKQOgrKKK2YtXsOfwQXy8dhNg71mfe/0D9tp50Fbb5T/yT64/c5LbrhoRyBGhtCI00yLVEQCX+xbRVkL/s05DEvFYbTIVXIydyS4ak5TZ2fsj1bKu21zMOb+dSU2tobbW8L0jxpJ3yB4cMe1+ikorMAb2Hz2UGZccX7/N4hXrADhwjA2wd8bEfdn30rsYMag/V546wct+NEN+GIJbtZVI3cOmk0wFlwC/962jNRxQ8tqr+5aljvCtQ6nnGfLyT/Itoj1EsUsMQCIeuwt41LeOluheW164T1lKQ22EhxXAub5FtJfIGtZxIfC+bxHNMbHohSUCg1peU+kCyoFTwxInpz1E2rCJeCwATsE+qRI6BlRvXDm06j8Z8XRWhnApeflLfIvYFiJtWIBEPPY+cJFvHY3xzcKnvxDQUJHh4EHy8u/3LWJbibxhARLx2KOEbEqZ0eXvvxmrLTnEtw4FgKXAJb5FdAQZYVjHTwjJlDJiaqoOK/7HQN86FAAKsfetZb6FdAQZY9hEPFYJnIYNr+CVeMnLC7pRE/oH/LOE88jL/9i3iI4iYwwLkIjH/gOcjp1Iyws9a0s37VG+dJyv8pWtuJG8/Kd9i+hIMsqwAIl4bDZwMp5MO6nwmWUC/X2UrWzFreTl/9y3iI4m4wwLkIjHZuHBtIOq1i0fVL0+1C+mZwm3kpd/hW8RnUFGGhb8mHZS4dNlksHHNCJkrFkhwytXV5p2z7Ili3qZ8nGdXY7SLBltVshww0LXmLabqS4/pOTlnTsrf6VVZLxZIQsMC51v2q8Xz349h1o1rD+ywqyQJYaFzjNtn5ri9aMr3tfZ+/2RNWaFLDIs1Jv2RKCoo/L8ZuHMFQKxjspPaTUGuCGbzApZZliARDz2InAw8O625jW0ctW/B9Rs0rdxup4twInk5ef7FtLVZJ1hARLx2EfAoUCy3ZkYYyYWPS9hnr0/Q1kMHERe/nO+hfggslPEdB
TJVHAhNmJZz7Zst0/w+vwDS+frQxJdyx+B/yUvv9y3EF9kvWEBkqngQOApYHRr1s+trSz5/qa7SnIwQztXmeIoA6aQlx/5ieS3lazsEjfERXs/EHi+NesfUfy3t9SsXcZHwHg1q0UN60jEY1uAE4CrgJqm1utX/eXqnSs/icz8whHnr8DB5OVv8wBhpqBd4kZIpoJvAPcBYxqmnbTp/kX9agvVsJ1LMXA1efmRmMa2K9EWthES8dgrwD7AtdiZ9gAYUfHxYjVrp/MYsJeatXG0hW2BZCrYFfidmNpvn/7F71fkUr2Hb00ZygfYWQ3n+hYSZtSwreTNl1855uDgX78D1LAdSyFwE/Bb8vK9zRQSFdSwbWFWQS52StVfAEM8q4k6VcAMoIC8/C98i4kKatj2MKugH3AldqbGSIQYDxlPYAeVVvgWEjXUsNvCrIKhwMXYkCHDPasJO6XYWEi/j/rs+z5Rw3YEtqt8AvAjYJJnNWHjQ2zX9yHy8rd0VaEiMhGYaow5voVVI4UatqOZVbAXMAU4h+ydPbEGeA64G5hLXn6XVzI1rNI2ZhXEgDOwre44v2K6jPXYB/TvJS9/zbZmJiKjgL8Di4DDgDeAB4HrsIN+Z7pV7wB6YZ85Ps8YszzdsCISw77gsQ821tF0Y8yz26rPB2rYrmBWwdeBs4GjaeTpqYizCZiLfYzwafLyqzoqY2fYj4EDgPewhl0KnA98FzgPSAClxphqEZkMTDHGnNLAsDcCy4wxj4jIAGxIlwOMMUFHae0qcn0LyAry8hcCCwGYVTAKmIw17ySiFzu2HHgNmAPMBhZ3cpd3pTHmXQAReQ+Ya4wxIvIuMAp72/GwiOyOnYWisWiB3wK+KyJT3fdewEhCHlu4MdSwXU1e/qfY55TvY1aBYFuPo7EmnoCtTGHCAEuw5pwDvNrF76NWpC3Xpn2vxdbfAmCeMeYk1yK/3EgeApxijFneiTq7BDWsT2zL9Lb7/JpZBb2wpj0U2DXtM5yuee77C+ATYKX7uxQ7aBTmBxv6A5+55XObWOcl4DIRucy1zgcYYxZ3iboORg0bJmzLNcd9vmJWQQ9gF7Y28a7YF+5HYFvlHtjuYGNT1lS5TyWwAWvG9I81aF5+cUfvUhdwM7ZLfA0wq4l1CoDbgXdEJAe7v5EcPdZBp0zD/ibcA2vcKn0+N7NQwypKhND3YRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUKoYRUlQqhhFSVCqGEVJUL8P24u4KANyzWDAAAAAElFTkSuQmCC", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "grafLocation(df2)" + ] + }, + { + "cell_type": "code", + "execution_count": 139, + "id": "8d085203", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + "
gender_femalegender_malecareer_actuariocareer_agronomíacareer_arquitecturacareer_bioquímicacareer_ciencias veterinariascareer_contador públicocareer_diseño de imagen y sonidocareer_diseño industrial...career_licenciatura en kinesiología y fisiatríacareer_licenciatura en musicoterapiacareer_licenciatura en planificación y diseño del paisajecareer_licenciatura en producción de bioimagenescareer_licenciatura en psicologíacareer_licenciatura en relaciones del trabajocareer_licenciatura en sociologíacareer_licenciatura en terapia ocupacionalcareer_medicinacareer_técnico para bioterios
count1831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.000000...1831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.0000001831.000000
mean0.4937190.5062810.0333150.0262150.0278540.0284000.0294920.0262150.0333150.037138...0.0267610.0360460.0344070.0316770.0251230.0240310.0316770.0289460.0393230.028946
std0.5000970.5000970.1795070.1598180.1645980.1661570.1692270.1598180.1795070.189152...0.1614290.1864550.1823230.1751860.1565410.1531860.1751860.1677000.1944150.167700
min0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
25%0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
50%0.0000001.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
75%1.0000001.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
max1.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.000000...1.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.000000
\n", + "

8 rows × 35 columns

\n", + "
" + ], + "text/plain": [ + " gender_female gender_male career_actuario career_agronomía \\\n", + "count 1831.000000 1831.000000 1831.000000 1831.000000 \n", + "mean 0.493719 0.506281 0.033315 0.026215 \n", + "std 0.500097 0.500097 0.179507 0.159818 \n", + "min 0.000000 0.000000 0.000000 0.000000 \n", + "25% 0.000000 0.000000 0.000000 0.000000 \n", + "50% 0.000000 1.000000 0.000000 0.000000 \n", + "75% 1.000000 1.000000 0.000000 0.000000 \n", + "max 1.000000 1.000000 1.000000 1.000000 \n", + "\n", + " career_arquitectura career_bioquímica career_ciencias veterinarias \\\n", + "count 1831.000000 1831.000000 1831.000000 \n", + "mean 0.027854 0.028400 0.029492 \n", + "std 0.164598 0.166157 0.169227 \n", + "min 0.000000 0.000000 0.000000 \n", + "25% 0.000000 0.000000 0.000000 \n", + "50% 0.000000 0.000000 0.000000 \n", + "75% 0.000000 0.000000 0.000000 \n", + "max 1.000000 1.000000 1.000000 \n", + "\n", + " career_contador público career_diseño de imagen y sonido \\\n", + "count 1831.000000 1831.000000 \n", + "mean 0.026215 0.033315 \n", + "std 0.159818 0.179507 \n", + "min 0.000000 0.000000 \n", + "25% 0.000000 0.000000 \n", + "50% 0.000000 0.000000 \n", + "75% 0.000000 0.000000 \n", + "max 1.000000 1.000000 \n", + "\n", + " career_diseño industrial ... \\\n", + "count 1831.000000 ... \n", + "mean 0.037138 ... \n", + "std 0.189152 ... \n", + "min 0.000000 ... \n", + "25% 0.000000 ... \n", + "50% 0.000000 ... \n", + "75% 0.000000 ... \n", + "max 1.000000 ... 
\n", + "\n", + " career_licenciatura en kinesiología y fisiatría \\\n", + "count 1831.000000 \n", + "mean 0.026761 \n", + "std 0.161429 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en musicoterapia \\\n", + "count 1831.000000 \n", + "mean 0.036046 \n", + "std 0.186455 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en planificación y diseño del paisaje \\\n", + "count 1831.000000 \n", + "mean 0.034407 \n", + "std 0.182323 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en producción de bioimagenes \\\n", + "count 1831.000000 \n", + "mean 0.031677 \n", + "std 0.175186 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en psicología \\\n", + "count 1831.000000 \n", + "mean 0.025123 \n", + "std 0.156541 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en relaciones del trabajo \\\n", + "count 1831.000000 \n", + "mean 0.024031 \n", + "std 0.153186 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en sociología \\\n", + "count 1831.000000 \n", + "mean 0.031677 \n", + "std 0.175186 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en terapia ocupacional career_medicina \\\n", + "count 1831.000000 1831.000000 \n", + "mean 0.028946 0.039323 \n", + "std 0.167700 0.194415 \n", + "min 0.000000 0.000000 \n", + "25% 0.000000 0.000000 \n", + "50% 0.000000 0.000000 \n", + "75% 0.000000 0.000000 \n", + "max 1.000000 1.000000 \n", + "\n", + 
" career_técnico para bioterios \n", + "count 1831.000000 \n", + "mean 0.028946 \n", + "std 0.167700 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + "[8 rows x 35 columns]" + ] + }, + "execution_count": 139, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dfg1.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 140, + "id": "e30911e0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + "
gender_femalegender_malecareer_actuariocareer_agronomíacareer_arquitecturacareer_bioquímicacareer_ciencias veterinariascareer_contador públicocareer_diseño de imagen y sonidocareer_diseño industrial...career_licenciatura en kinesiología y fisiatríacareer_licenciatura en musicoterapiacareer_licenciatura en planificación y diseño del paisajecareer_licenciatura en producción de bioimagenescareer_licenciatura en psicologíacareer_licenciatura en relaciones del trabajocareer_licenciatura en sociologíacareer_licenciatura en terapia ocupacionalcareer_medicinacareer_técnico para bioterios
count1904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.000000...1904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.0000001904.000000
mean0.5215340.4784660.0288870.0252100.0204830.0267860.0288870.0357140.0330880.029937...0.0309870.0367650.0299370.0304620.0278360.0304620.0309870.0320380.0294120.026786
std0.4996670.4996670.1675320.1568040.1416830.1614990.1675320.1856260.1789140.170458...0.1733290.1882330.1704580.1719000.1645460.1719000.1733290.1761470.1690020.161499
min0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
25%0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
50%1.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
75%1.0000001.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000...0.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.0000000.000000
max1.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.000000...1.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.0000001.000000
\n", + "

8 rows × 35 columns

\n", + "
" + ], + "text/plain": [ + " gender_female gender_male career_actuario career_agronomía \\\n", + "count 1904.000000 1904.000000 1904.000000 1904.000000 \n", + "mean 0.521534 0.478466 0.028887 0.025210 \n", + "std 0.499667 0.499667 0.167532 0.156804 \n", + "min 0.000000 0.000000 0.000000 0.000000 \n", + "25% 0.000000 0.000000 0.000000 0.000000 \n", + "50% 1.000000 0.000000 0.000000 0.000000 \n", + "75% 1.000000 1.000000 0.000000 0.000000 \n", + "max 1.000000 1.000000 1.000000 1.000000 \n", + "\n", + " career_arquitectura career_bioquímica career_ciencias veterinarias \\\n", + "count 1904.000000 1904.000000 1904.000000 \n", + "mean 0.020483 0.026786 0.028887 \n", + "std 0.141683 0.161499 0.167532 \n", + "min 0.000000 0.000000 0.000000 \n", + "25% 0.000000 0.000000 0.000000 \n", + "50% 0.000000 0.000000 0.000000 \n", + "75% 0.000000 0.000000 0.000000 \n", + "max 1.000000 1.000000 1.000000 \n", + "\n", + " career_contador público career_diseño de imagen y sonido \\\n", + "count 1904.000000 1904.000000 \n", + "mean 0.035714 0.033088 \n", + "std 0.185626 0.178914 \n", + "min 0.000000 0.000000 \n", + "25% 0.000000 0.000000 \n", + "50% 0.000000 0.000000 \n", + "75% 0.000000 0.000000 \n", + "max 1.000000 1.000000 \n", + "\n", + " career_diseño industrial ... \\\n", + "count 1904.000000 ... \n", + "mean 0.029937 ... \n", + "std 0.170458 ... \n", + "min 0.000000 ... \n", + "25% 0.000000 ... \n", + "50% 0.000000 ... \n", + "75% 0.000000 ... \n", + "max 1.000000 ... 
\n", + "\n", + " career_licenciatura en kinesiología y fisiatría \\\n", + "count 1904.000000 \n", + "mean 0.030987 \n", + "std 0.173329 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en musicoterapia \\\n", + "count 1904.000000 \n", + "mean 0.036765 \n", + "std 0.188233 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en planificación y diseño del paisaje \\\n", + "count 1904.000000 \n", + "mean 0.029937 \n", + "std 0.170458 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en producción de bioimagenes \\\n", + "count 1904.000000 \n", + "mean 0.030462 \n", + "std 0.171900 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en psicología \\\n", + "count 1904.000000 \n", + "mean 0.027836 \n", + "std 0.164546 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en relaciones del trabajo \\\n", + "count 1904.000000 \n", + "mean 0.030462 \n", + "std 0.171900 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en sociología \\\n", + "count 1904.000000 \n", + "mean 0.030987 \n", + "std 0.173329 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + " career_licenciatura en terapia ocupacional career_medicina \\\n", + "count 1904.000000 1904.000000 \n", + "mean 0.032038 0.029412 \n", + "std 0.176147 0.169002 \n", + "min 0.000000 0.000000 \n", + "25% 0.000000 0.000000 \n", + "50% 0.000000 0.000000 \n", + "75% 0.000000 0.000000 \n", + "max 1.000000 1.000000 \n", + "\n", + 
" career_técnico para bioterios \n", + "count 1904.000000 \n", + "mean 0.026786 \n", + "std 0.161499 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 0.000000 \n", + "max 1.000000 \n", + "\n", + "[8 rows x 35 columns]" + ] + }, + "execution_count": 140, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dft2.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 141, + "id": "65adf584", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
countuniquetopfreq
careeragegender
actuario17female41actuario4
male21actuario2
18female11actuario1
19female21actuario2
male41actuario4
.....................
técnico para bioterios35female21técnico para bioterios2
male31técnico para bioterios3
37female11técnico para bioterios1
male21técnico para bioterios2
39female21técnico para bioterios2
\n", + "

863 rows × 4 columns

\n", + "
" + ], + "text/plain": [ + " count unique top freq\n", + "career age gender \n", + "actuario 17 female 4 1 actuario 4\n", + " male 2 1 actuario 2\n", + " 18 female 1 1 actuario 1\n", + " 19 female 2 1 actuario 2\n", + " male 4 1 actuario 4\n", + "... ... ... ... ...\n", + "técnico para bioterios 35 female 2 1 técnico para bioterios 2\n", + " male 3 1 técnico para bioterios 3\n", + " 37 female 1 1 técnico para bioterios 1\n", + " male 2 1 técnico para bioterios 2\n", + " 39 female 2 1 técnico para bioterios 2\n", + "\n", + "[863 rows x 4 columns]" + ] + }, + "execution_count": 141, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df1.career.groupby([df1.career,df1.age,df1.gender]).describe()\n", + "\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 142, + "id": "6237473f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
countuniquetopfreq
careeragegender
actuario17female51actuario5
18female11actuario1
19female11actuario1
male11actuario1
21female11actuario1
.....................
técnico para bioterios33female21técnico para bioterios2
male11técnico para bioterios1
35female31técnico para bioterios3
37male51técnico para bioterios5
39male21técnico para bioterios2
\n", + "

819 rows × 4 columns

\n", + "
" + ], + "text/plain": [ + " count unique top freq\n", + "career age gender \n", + "actuario 17 female 5 1 actuario 5\n", + " 18 female 1 1 actuario 1\n", + " 19 female 1 1 actuario 1\n", + " male 1 1 actuario 1\n", + " 21 female 1 1 actuario 1\n", + "... ... ... ... ...\n", + "técnico para bioterios 33 female 2 1 técnico para bioterios 2\n", + " male 1 1 técnico para bioterios 1\n", + " 35 female 3 1 técnico para bioterios 3\n", + " 37 male 5 1 técnico para bioterios 5\n", + " 39 male 2 1 técnico para bioterios 2\n", + "\n", + "[819 rows x 4 columns]" + ] + }, + "execution_count": 142, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df2.career.groupby([df2.career,df2.age,df2.gender]).describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 143, + "id": "85952af2", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "73" + ] + }, + "execution_count": 143, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dif = len(df2)-len(df1)\n", + "dif" + ] + }, + { + "cell_type": "code", + "execution_count": 144, + "id": "2abb3d0a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "3.8340336134453783" + ] + }, + "execution_count": 144, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dif/len(df2)*100" + ] + }, + { + "cell_type": "code", + "execution_count": 145, + "id": "05e675f2", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "univ. 
nacional del comahue\n", + "29 170\n" + ] + } + ], + "source": [ + "ma=df1.university.groupby(df1.age).describe()\n", + "\n", + "# dat['count'].unique()\n", + "f =ma['count'] == ma['count'].max()\n", + "name_L=ma[f].index[0]\n", + "# loca =df1.location == ma[f].index[0]\n", + "name_L\n", + "ma\n", + "print(df1.university[0])\n", + "print(name_L, ma['count'].max())\n" + ] + }, + { + "cell_type": "code", + "execution_count": 146, + "id": "9e50c6c6", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
countuniquetopfreq
age
171361univ. nacional del comahue136
18161univ. nacional del comahue16
191251univ. nacional del comahue125
20161univ. nacional del comahue16
211221univ. nacional del comahue122
22171univ. nacional del comahue17
231211univ. nacional del comahue121
24181univ. nacional del comahue18
251441univ. nacional del comahue144
26111univ. nacional del comahue11
271251univ. nacional del comahue125
28211univ. nacional del comahue21
291701univ. nacional del comahue170
30151univ. nacional del comahue15
311461univ. nacional del comahue146
32141univ. nacional del comahue14
331281univ. nacional del comahue128
34181univ. nacional del comahue18
351501univ. nacional del comahue150
36121univ. nacional del comahue12
371481univ. nacional del comahue148
38241univ. nacional del comahue24
391201univ. nacional del comahue120
40141univ. nacional del comahue14
\n", + "
" + ], + "text/plain": [ + " count unique top freq\n", + "age \n", + "17 136 1 univ. nacional del comahue 136\n", + "18 16 1 univ. nacional del comahue 16\n", + "19 125 1 univ. nacional del comahue 125\n", + "20 16 1 univ. nacional del comahue 16\n", + "21 122 1 univ. nacional del comahue 122\n", + "22 17 1 univ. nacional del comahue 17\n", + "23 121 1 univ. nacional del comahue 121\n", + "24 18 1 univ. nacional del comahue 18\n", + "25 144 1 univ. nacional del comahue 144\n", + "26 11 1 univ. nacional del comahue 11\n", + "27 125 1 univ. nacional del comahue 125\n", + "28 21 1 univ. nacional del comahue 21\n", + "29 170 1 univ. nacional del comahue 170\n", + "30 15 1 univ. nacional del comahue 15\n", + "31 146 1 univ. nacional del comahue 146\n", + "32 14 1 univ. nacional del comahue 14\n", + "33 128 1 univ. nacional del comahue 128\n", + "34 18 1 univ. nacional del comahue 18\n", + "35 150 1 univ. nacional del comahue 150\n", + "36 12 1 univ. nacional del comahue 12\n", + "37 148 1 univ. nacional del comahue 148\n", + "38 24 1 univ. nacional del comahue 24\n", + "39 120 1 univ. nacional del comahue 120\n", + "40 14 1 univ. 
nacional del comahue 14" + ] + }, + "execution_count": 146, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ma" + ] + }, + { + "cell_type": "code", + "execution_count": 147, + "id": "2727806d", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "53.52266521026762" + ] + }, + "execution_count": 147, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "EdT1=ma.sum()\n", + "ma\n", + "ma[ma.index > 27].sum()\n", + "ma[ma.index > 27].sum()[0]/ma.sum()[0]*100\n", + "\n", + "# len(df1)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 148, + "id": "c56131b0", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "universidad del salvador\n", + "25 202\n" + ] + } + ], + "source": [ + "ma=df2.university.groupby(df2.age).describe()\n", + "\n", + "# dat['count'].unique()\n", + "f =ma['count'] == ma['count'].max()\n", + "name_L=ma[f].index[0]\n", + "# loca =df1.location == ma[f].index[0]\n", + "name_L\n", + "print(df2.university[0])\n", + "print(name_L, ma['count'].max())" + ] + }, + { + "cell_type": "code", + "execution_count": 149, + "id": "e55edee8", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
countuniquetopfreq
age
171231universidad del salvador123
18281universidad del salvador28
191601universidad del salvador160
20201universidad del salvador20
211171universidad del salvador117
22191universidad del salvador19
231791universidad del salvador179
24511universidad del salvador51
252021universidad del salvador202
26531universidad del salvador53
271751universidad del salvador175
291191universidad del salvador119
311321universidad del salvador132
331371universidad del salvador137
351211universidad del salvador121
371451universidad del salvador145
391231universidad del salvador123
\n", + "
" + ], + "text/plain": [ + " count unique top freq\n", + "age \n", + "17 123 1 universidad del salvador 123\n", + "18 28 1 universidad del salvador 28\n", + "19 160 1 universidad del salvador 160\n", + "20 20 1 universidad del salvador 20\n", + "21 117 1 universidad del salvador 117\n", + "22 19 1 universidad del salvador 19\n", + "23 179 1 universidad del salvador 179\n", + "24 51 1 universidad del salvador 51\n", + "25 202 1 universidad del salvador 202\n", + "26 53 1 universidad del salvador 53\n", + "27 175 1 universidad del salvador 175\n", + "29 119 1 universidad del salvador 119\n", + "31 132 1 universidad del salvador 132\n", + "33 137 1 universidad del salvador 137\n", + "35 121 1 universidad del salvador 121\n", + "37 145 1 universidad del salvador 145\n", + "39 123 1 universidad del salvador 123" + ] + }, + "execution_count": 149, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "EdadT2=ma.sum()\n", + "ma" + ] + }, + { + "cell_type": "code", + "execution_count": 150, + "id": "0ada37ea", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "40.80882352941176" + ] + }, + "execution_count": 150, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ma[ma.index > 27].sum()[0]/ma.sum()[0]*100" + ] + }, + { + "cell_type": "code", + "execution_count": 151, + "id": "60284dc0", + "metadata": {}, + "outputs": [], + "source": [ + "# ma=df1.university.groupby(df1.location).describe()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7fe7a293", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 152, + "id": "6cbf6573", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "73" + ] + }, + "execution_count": 152, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df2.university.groupby(df2.career).count().max()" + ] + }, + { + "cell_type": "markdown", + "id": "c3bbb734", + "metadata": 
{}, + "source": [ + "# Conclusión\n", + "\n", + "- La mayor parte de la población inscrita entre 2020-09-01 e inicios de 2021-02-01 es de mujeres, con un 52% para la universidad del Salvador, a diferencia de la universidad del Comahue, donde su mayor población es de hombres con un 51%; la universidad del Salvador solo tiene 73 personas inscritas más que la universidad del Comahue, equivalente a un 4 % aproximadamente.\n", + "- La edad promedio de los inscritos se encuentra entre los 27 y 28 años, aunque la mayor cantidad de inscritos en el periodo de tiempo establecido tiene la edad de 23 años para ambas universidades; la edad mínima está en 17 años y la máxima en 40 años. Además, la universidad del Comahue tiene su mayor población mayor a 27 años con un valor del 50%, a diferencia de la universidad del Salvador con un 40.5 %; por tanto, la universidad del Salvador tiene personas más jóvenes.\n", + "- La mayor población que proviene de una misma localidad es de 12 para la universidad del Comahue, para la localidad de 25 de mayo, y de 10 para la universidad del Salvador, para la localidad agua colorada. Al realizar las gráficas sobre el dataset general, se observó el mismo comportamiento para el género de las inscripciones, tomando la tendencia general de los datos; la elección de carrera presenta gran variedad por localidad, edad y género, como se observa en el gráfico que relaciona la edad, carrera y género." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "08c53a16", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "adc1a753", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "67a87854", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ee86c7ab", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "24c79477", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.8" + }, + "vscode": { + "interpreter": { + "hash": "ff0d91300876931207232d01add3156fa7c8214350996c757a3c6cebc4b3b5d5" + } + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/dags/ETL_configGrupoB.yml b/dags/ETL_configGrupoB.yml new file mode 100644 index 00000000..ad0c12e5 --- /dev/null +++ b/dags/ETL_configGrupoB.yml @@ -0,0 +1,55 @@ + +default: + default_args: + owner: "BROC95" + start_date: 2018-03-01 + # end_date: 2018-03-05 + retries: 1 + retry_delay_sec: 300 + concurrency: 1 + max_active_runs: 1 + dagrun_timeout_sec: 600 + default_view: "tree" + orientation: "LR" + schedule_interval: "@daily" + + + + +ETL_dag: + tasks: + + Extract_B1: + operator: airflow.operators.python.PythonOperator + + python_callable_name: 'extract' + python_callable_file: /usr/local/airflow/dags/GBUNComahue_dag_elt.py + + Transform_B1: + operator: airflow.operators.python.PythonOperator + python_callable_name: 'transform' + python_callable_file: 
/usr/local/airflow/dags/GBUNComahue_dag_elt.py + dependencies: [Extract_B1] + Load_B1: + operator: airflow.operators.python.PythonOperator + python_callable_name: 'load' + python_callable_file: /usr/local/airflow/dags/GBUNComahue_dag_elt.py + dependencies: [Transform_B1] + + Extract_B2: + operator: airflow.operators.python.PythonOperator + python_callable_name: 'extract' + python_callable_file: /usr/local/airflow/dags/GBUNSalvador_dag_elt.py + + Transform_B2: + operator: airflow.operators.python.PythonOperator + python_callable_name: 'transform' + python_callable_file: /usr/local/airflow/dags/GBUNSalvador_dag_elt.py + dependencies: [Extract_B2] + Load_B2: + operator: airflow.operators.python.PythonOperator + python_callable_name: 'load' + python_callable_file: /usr/local/airflow/dags/GBUNSalvador_dag_elt.py + dependencies: [Transform_B2] + + diff --git a/dags/GBUNComahue_dag_elt.py b/dags/GBUNComahue_dag_elt.py new file mode 100644 index 00000000..42ed4fc5 --- /dev/null +++ b/dags/GBUNComahue_dag_elt.py @@ -0,0 +1,128 @@ + +# BROC95 +from plugins.sqlCommandB import csvFile, identExt +from plugins.connectionDag import configDag, configLog +from plugins.dataTrasB import data_transform +from datetime import datetime, timedelta +from plugins.sqlCommandB import sqlCommand, createPath +import json +import pandas as pd +from airflow import DAG +from airflow.operators.python import PythonOperator +import logging +from sqlalchemy import create_engine +import logging.config +import os +from airflow.providers.postgres.hooks.postgres import PostgresHook +import logging +import boto3 +from botocore.exceptions import ClientError + +name_data = 'GBUNComahue' + + +dag_name = '_dag_elt' +selec = "_select.csv" +sql_ = ".sql" +process = "_process.txt" + +dag_ = name_data+dag_name +query_name = name_data+sql_ +select_name = name_data+selec +process_name = name_data+process + + +default_args, POSTGRES_CONN_ID, ACCESS_KEY, SECRET_ACCESS_KEY, AWS_S3_CONN_ID, BUCKET = configDag() + + +# 
Extract data with hook,pandas .csv + +def extract(): + + logger = configLog(dag_) + + logger.info(dag_) + logger.info("Extract") + logger.info("Connect: % s", POSTGRES_CONN_ID) + + hook = PostgresHook(postgres_conn_id=POSTGRES_CONN_ID) + + query = sqlCommand( + file=query_name, point='include') + conn = hook.get_conn() + # logging.info(conn) + + df = hook.get_pandas_df(sql=query) + + logger.info(df.head()) + pathCsv = createPath('files') + # pathCsv = createPath('include') # Correccion a guardar localmente + + js = df.to_json(orient='columns') + # print("Create csv") + df.to_csv(pathCsv+'/'+select_name) + conn.close() + + +# Transform data with pandas + +def transform(): + logger = configLog(dag_) + logger.info("Transform") + + pathfile = createPath('files') + + fileSelect = csvFile(pathfile, select_name) + + data_transform(fileSelect) + + # print(POSTGRES_CONN_ID) + + +# Load data with S3 amazon .txt + +def load(): + logger = configLog(dag_) + logger.info("Load: %s", dag_) + logger.info("Connect: % s", AWS_S3_CONN_ID) + + # def upload_file(file_name, bucket, object_name): + """Upload a file to an S3 bucket + + :param file_name: File to upload + :param bucket: Bucket to upload to + :param object_name: S3 object name. 
If not specified then file_name is used + :return: True if file was uploaded, else False + """ + dest_file_path = createPath('datasets') + file_name = dest_file_path+'/' + process_name + bucket = BUCKET + object_name = process_name + + session = boto3.Session( + aws_access_key_id=ACCESS_KEY, + aws_secret_access_key=SECRET_ACCESS_KEY, + ) + # client = session.client("s3") + s3_client = session.client('s3') + try: + response = s3_client.upload_file(file_name, bucket, object_name) + except ClientError as e: + logger.error(e) + return False + return True + + +with DAG(dag_id=dag_, start_date=datetime(2022, 11, 4), schedule_interval=timedelta(hours=1), default_args=default_args, catchup=False) as dag: + # Extract + task1 = PythonOperator(task_id="TaskExtract", + python_callable=extract) + # Transform + task2 = PythonOperator(task_id="TaskTransform", + python_callable=transform) + # Load + task3 = PythonOperator(task_id="TaskLoad", + python_callable=load) + +task1 >> task2 >> task3 +# task1 \ No newline at end of file diff --git a/dags/GBUNSalvador_dag_elt.py b/dags/GBUNSalvador_dag_elt.py new file mode 100644 index 00000000..b811ac9c --- /dev/null +++ b/dags/GBUNSalvador_dag_elt.py @@ -0,0 +1,128 @@ + +# BROC95 +from plugins.sqlCommandB import csvFile, identExt +from plugins.connectionDag import configDag, configLog +from plugins.dataTrasB import data_transform +from datetime import datetime, timedelta +from plugins.sqlCommandB import sqlCommand, createPath +import json +import pandas as pd +from airflow import DAG +from airflow.operators.python import PythonOperator +import logging +from sqlalchemy import create_engine +import logging.config +import os +from airflow.providers.postgres.hooks.postgres import PostgresHook +import logging +import boto3 +from botocore.exceptions import ClientError + +name_data = 'GBUNSalvador' + + +dag_name = '_dag_elt' +selec = "_select.csv" +sql_ = ".sql" +process = "_process.txt" + +dag_ = name_data+dag_name +query_name = name_data+sql_ 
+select_name = name_data+selec +process_name = name_data+process + + +default_args, POSTGRES_CONN_ID, ACCESS_KEY, SECRET_ACCESS_KEY, AWS_S3_CONN_ID, BUCKET = configDag() + + +# Extract data with hook,pandas .csv + +def extract(): + + logger = configLog(dag_) + + logger.info(dag_) + logger.info("Extract") + logger.info("Connect: % s", POSTGRES_CONN_ID) + + hook = PostgresHook(postgres_conn_id=POSTGRES_CONN_ID) + + query = sqlCommand( + file=query_name, point='include') + conn = hook.get_conn() + # logging.info(conn) + + df = hook.get_pandas_df(sql=query) + + logger.info(df.head()) + pathCsv = createPath('files') + # pathCsv = createPath('include') # Correccion a guardar localmente + + js = df.to_json(orient='columns') + # print("Create csv") + df.to_csv(pathCsv+'/'+select_name) + conn.close() + + +# Transform data with pandas + +def transform(): + logger = configLog(dag_) + logger.info("Transform") + + pathfile = createPath('files') + + fileSelect = csvFile(pathfile, select_name) + + data_transform(fileSelect) + + # print(POSTGRES_CONN_ID) + + +# Load data with S3 amazon .txt + +def load(): + logger = configLog(dag_) + logger.info("Load: %s", dag_) + logger.info("Connect: % s", AWS_S3_CONN_ID) + + # def upload_file(file_name, bucket, object_name): + """Upload a file to an S3 bucket + + :param file_name: File to upload + :param bucket: Bucket to upload to + :param object_name: S3 object name. 
If not specified then file_name is used + :return: True if file was uploaded, else False + """ + dest_file_path = createPath('datasets') + file_name = dest_file_path+'/' + process_name + bucket = BUCKET + object_name = process_name + + session = boto3.Session( + aws_access_key_id=ACCESS_KEY, + aws_secret_access_key=SECRET_ACCESS_KEY, + ) + # client = session.client("s3") + s3_client = session.client('s3') + try: + response = s3_client.upload_file(file_name, bucket, object_name) + except ClientError as e: + logger.error(e) + return False + return True + + +with DAG(dag_id=dag_, start_date=datetime(2022, 11, 4), schedule_interval=timedelta(hours=1), default_args=default_args, catchup=False) as dag: + # Extract + task1 = PythonOperator(task_id="TaskExtract", + python_callable=extract) + # Transform + task2 = PythonOperator(task_id="TaskTransform", + python_callable=transform) + # Load + task3 = PythonOperator(task_id="TaskLoad", + python_callable=load) + +task1 >> task2 >> task3 +# task1 \ No newline at end of file diff --git a/dags/dags_dynamic/grupoB/Temp_UNDag.jinja2 b/dags/dags_dynamic/grupoB/Temp_UNDag.jinja2 new file mode 100644 index 00000000..3be548bc --- /dev/null +++ b/dags/dags_dynamic/grupoB/Temp_UNDag.jinja2 @@ -0,0 +1,128 @@ + +# BROC95 +from plugins.sqlCommandB import csvFile, identExt +from plugins.connectionDag import configDag, configLog +from plugins.dataTrasB import data_transform +from datetime import datetime, timedelta +from plugins.sqlCommandB import sqlCommand, createPath +import json +import pandas as pd +from airflow import DAG +from airflow.operators.python import PythonOperator +import logging +from sqlalchemy import create_engine +import logging.config +import os +from airflow.providers.postgres.hooks.postgres import PostgresHook +import logging +import boto3 +from botocore.exceptions import ClientError + +name_data = '{{name_dag}}' + + +dag_name = '_dag_elt' +selec = "_select.csv" +sql_ = ".sql" +process = "_process.txt" + +dag_ = 
name_data+dag_name +query_name = name_data+sql_ +select_name = name_data+selec +process_name = name_data+process + + +default_args, POSTGRES_CONN_ID, ACCESS_KEY, SECRET_ACCESS_KEY, AWS_S3_CONN_ID, BUCKET = configDag() + + +# Extract data with hook,pandas .csv + +def extract(): + + logger = configLog(dag_) + + logger.info(dag_) + logger.info("Extract") + logger.info("Connect: % s", POSTGRES_CONN_ID) + + hook = PostgresHook(postgres_conn_id=POSTGRES_CONN_ID) + + query = sqlCommand( + file=query_name, point='include') + conn = hook.get_conn() + # logging.info(conn) + + df = hook.get_pandas_df(sql=query) + + logger.info(df.head()) + pathCsv = createPath('files') + # pathCsv = createPath('include') # Correccion a guardar localmente + + js = df.to_json(orient='columns') + # print("Create csv") + df.to_csv(pathCsv+'/'+select_name) + conn.close() + + +# Transform data with pandas + +def transform(): + logger = configLog(dag_) + logger.info("Transform") + + pathfile = createPath('files') + + fileSelect = csvFile(pathfile, select_name) + + data_transform(fileSelect) + + # print(POSTGRES_CONN_ID) + + +# Load data with S3 amazon .txt + +def load(): + logger = configLog(dag_) + logger.info("Load: %s", dag_) + logger.info("Connect: % s", AWS_S3_CONN_ID) + + # def upload_file(file_name, bucket, object_name): + """Upload a file to an S3 bucket + + :param file_name: File to upload + :param bucket: Bucket to upload to + :param object_name: S3 object name. 
If not specified then file_name is used + :return: True if file was uploaded, else False + """ + dest_file_path = createPath('datasets') + file_name = dest_file_path+'/' + process_name + bucket = BUCKET + object_name = process_name + + session = boto3.Session( + aws_access_key_id=ACCESS_KEY, + aws_secret_access_key=SECRET_ACCESS_KEY, + ) + # client = session.client("s3") + s3_client = session.client('s3') + try: + response = s3_client.upload_file(file_name, bucket, object_name) + except ClientError as e: + logger.error(e) + return False + return True + + +with DAG(dag_id=dag_, start_date=datetime(2022, 11, 4), schedule_interval=timedelta(hours={{schedule_interval}}), default_args=default_args, catchup={{catchup or False}}) as dag: + # Extract + task1 = PythonOperator(task_id="TaskExtract", + python_callable=extract) + # Transform + task2 = PythonOperator(task_id="TaskTransform", + python_callable=transform) + # Load + task3 = PythonOperator(task_id="TaskLoad", + python_callable=load) + +task1 >> task2 >> task3 +# task1 diff --git a/dags/dags_dynamic/grupoB/config_GBUNComahue.yaml b/dags/dags_dynamic/grupoB/config_GBUNComahue.yaml new file mode 100644 index 00000000..07a43fd5 --- /dev/null +++ b/dags/dags_dynamic/grupoB/config_GBUNComahue.yaml @@ -0,0 +1,3 @@ +name_dag: "GBUNComahue" +schedule_interval: 1 +catchup: False \ No newline at end of file diff --git a/dags/dags_dynamic/grupoB/config_GBUNSalvador.yaml b/dags/dags_dynamic/grupoB/config_GBUNSalvador.yaml new file mode 100644 index 00000000..3c285747 --- /dev/null +++ b/dags/dags_dynamic/grupoB/config_GBUNSalvador.yaml @@ -0,0 +1,3 @@ +name_dag: "GBUNSalvador" +schedule_interval: 1 +catchup: False \ No newline at end of file diff --git a/dags/dags_dynamic/grupoB/generatorGB.py b/dags/dags_dynamic/grupoB/generatorGB.py new file mode 100644 index 00000000..e3ef26c4 --- /dev/null +++ b/dags/dags_dynamic/grupoB/generatorGB.py @@ -0,0 +1,15 @@ +from jinja2 import Environment, FileSystemLoader +import yaml +import 
os + +file_dir = os.path.dirname(os.path.abspath(__file__)) +env = Environment(loader=FileSystemLoader(file_dir)) + +tempate = env.get_or_select_template('Temp_UNDag.jinja2') +dag_name = '_dag_elt' +for filename in os.listdir(file_dir): + if filename.endswith(".yaml"): + with open(f"{file_dir}/{filename}",'r') as cong: + config = yaml.safe_load(cong) + with open(f"dags/{config['name_dag']}{dag_name}.py", "w") as f: + f.write(tempate.render(config)) \ No newline at end of file diff --git a/dags/factoryGB.py b/dags/factoryGB.py new file mode 100644 index 00000000..8753edc7 --- /dev/null +++ b/dags/factoryGB.py @@ -0,0 +1,14 @@ + +from airflow import DAG +import dagfactory + + +config_file = "/usr/local/airflow/dags/ETL_configGrupoB.yml" +example_dag_factory = dagfactory.DagFactory(config_file) +# Creating task dependencies + +example_dag_factory.clean_dags(globals()) + +example_dag_factory.generate_dags(globals()) + + diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=ETL/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=ETL/attempt=1.log" new file mode 100644 index 00000000..01ef044d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=ETL/attempt=1.log" @@ -0,0 +1,31 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T14:47:58.056370Z", "eventType": "START", "inputs": [], "job": {"facets": {"documentation": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DocumentationJobFacet", "description": "this is an ETL dag!"}}, "name": "ETL_dag.ETL", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-01-01T00:00:00+00:00", "task_id": "ETL"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Extract_B1', 'Extract_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": 
"default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-01-01T00:00:00+00:00", "task_group": "", "task_id": "ETL", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T14:46:55.572752Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c875c6a8-3547-37e7-9172-3a00e7533021"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c875c6a8-3547-37e7-9172-3a00e7533021"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "ETL"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, 
"executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "ETL", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cc3f01d-6cc8-4f78-9d74-46d645ff2f89"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=ETL, dagrun_id=manual__2022-11-10T14:46:55.572752+00:00, map_index=-1, run_start_date=2022-11-10 14:47:58.056370+00:00, try_number=1, job_id=10, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 14:46:55.572752+00:00 +INFO - Started process 191 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'ETL', 'manual__2022-11-10T14:46:55.572752+00:00', '--job-id', '10', '--raw', '--subdir', 'DAGS_FOLDER/dag_factory/factory.py', '--cfg-path', '/tmp/tmpeadwofty'] +INFO - Job 10: Subtask ETL +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host b33e9ad29d64 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=ETL +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T14:46:55.572752+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T14:46:55.572752+00:00 +INFO - Init process ETL Alkemy +INFO - Broc95 +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=ETL, execution_date=20221110T144655, start_date=20221110T144758, end_date=20221110T144758 +INFO - {"eventTime": "2022-11-10T14:47:58.938538Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.ETL", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "ETL"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "ETL", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cc3f01d-6cc8-4f78-9d74-46d645ff2f89"}} +INFO - Task exited with return code 0 +INFO - 2 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=Extract_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..29b16895 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,47 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T14:48:00.672151Z", "eventType": "START", "inputs": [], "job": {"facets": {"documentation": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DocumentationJobFacet", "description": "this is an ETL dag!"}}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": 
{"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-01-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-01-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'ETL'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T14:46:55.572752Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c875c6a8-3547-37e7-9172-3a00e7533021"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": 
{"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c875c6a8-3547-37e7-9172-3a00e7533021"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d35c67bf-9d37-4ef4-80eb-efe6dae908f8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=manual__2022-11-10T14:46:55.572752+00:00, map_index=-1, run_start_date=2022-11-10 14:48:00.672151+00:00, try_number=1, job_id=12, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 14:46:55.572752+00:00 +INFO - Started process 200 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'manual__2022-11-10T14:46:55.572752+00:00', '--job-id', '12', '--raw', '--subdir', 'DAGS_FOLDER/dag_factory/factory.py', '--cfg-path', 
'/tmp/tmps3kl8yhz'] +INFO - Job 12: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host b33e9ad29d64 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T14:46:55.572752+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T14:46:55.572752+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 52, in extract + conn = hook.get_conn() + File "/usr/local/lib/python3.9/site-packages/airflow/providers/postgres/hooks/postgres.py", line 88, in get_conn + conn = deepcopy(self.connection or self.get_connection(conn_id)) + File "/usr/local/lib/python3.9/site-packages/airflow/hooks/base.py", line 70, in get_connection + conn = Connection.get_connection_from_secrets(conn_id) + File "/usr/local/lib/python3.9/site-packages/airflow/models/connection.py", line 432, in get_connection_from_secrets + raise AirflowNotFoundException(f"The conn_id `{conn_id}` isn't defined") +airflow.exceptions.AirflowNotFoundException: The conn_id `alkemy_db` isn't defined +INFO - Marking task as UP_FOR_RETRY. 
dag_id=ETL_dag, task_id=Extract_B1, execution_date=20221110T144655, start_date=20221110T144800, end_date=20221110T144802 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 12 for task Extract_B1 (The conn_id `alkemy_db` isn't defined; 200) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..06d8fb8b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-10T14\357\200\27246\357\200\27255.572752+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,47 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T14:48:00.660488Z", "eventType": "START", "inputs": [], "job": {"facets": {"documentation": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DocumentationJobFacet", "description": "this is an ETL dag!"}}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-01-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": 
"default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-01-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'ETL'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T14:46:55.572752Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c875c6a8-3547-37e7-9172-3a00e7533021"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c875c6a8-3547-37e7-9172-3a00e7533021"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, 
"email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d3e8dad-9d31-42fe-9aff-e39f16f760d9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=manual__2022-11-10T14:46:55.572752+00:00, map_index=-1, run_start_date=2022-11-10 14:48:00.660488+00:00, try_number=1, job_id=11, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 14:46:55.572752+00:00 +INFO - Started process 199 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'manual__2022-11-10T14:46:55.572752+00:00', '--job-id', '11', '--raw', '--subdir', 'DAGS_FOLDER/dag_factory/factory.py', '--cfg-path', '/tmp/tmp60t8d0c3'] +INFO - Job 11: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host b33e9ad29d64 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T14:46:55.572752+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T14:46:55.572752+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 52, in extract + conn = hook.get_conn() + File "/usr/local/lib/python3.9/site-packages/airflow/providers/postgres/hooks/postgres.py", line 88, in get_conn + conn = deepcopy(self.connection or self.get_connection(conn_id)) + File "/usr/local/lib/python3.9/site-packages/airflow/hooks/base.py", line 70, in get_connection + conn = Connection.get_connection_from_secrets(conn_id) + File "/usr/local/lib/python3.9/site-packages/airflow/models/connection.py", line 432, in get_connection_from_secrets + raise AirflowNotFoundException(f"The conn_id `{conn_id}` isn't defined") +airflow.exceptions.AirflowNotFoundException: The conn_id `alkemy_db` isn't defined +INFO - Marking task as UP_FOR_RETRY. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20221110T144655, start_date=20221110T144800, end_date=20221110T144802 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 11 for task Extract_B2 (The conn_id `alkemy_db` isn't defined; 199) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..8dc0e583 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:38.851342Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-11T00:23:02.335840Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5de08e95-147c-4c37-88fe-afcebb620fea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=manual__2022-11-11T00:23:02.335840+00:00, map_index=-1, run_start_date=2022-11-11 00:23:38.851342+00:00, try_number=1, job_id=54, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-11 00:23:02.335840+00:00 +INFO - Started process 228 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'manual__2022-11-11T00:23:02.335840+00:00', '--job-id', '54', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt80r2nas'] +INFO - Job 54: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-11T00:23:02.335840+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20221111T002302, start_date=20221111T002338, end_date=20221111T002342 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 
'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:42.418514Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5de08e95-147c-4c37-88fe-afcebb620fea"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..43972b6a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - 
+-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:23:38.694174Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", 
"pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-11T00:23:02.335840Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": 
true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4665c8a6-c526-428e-9978-583e7df90752"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=manual__2022-11-11T00:23:02.335840+00:00, map_index=-1, run_start_date=2022-11-11 00:23:38.694174+00:00, try_number=1, job_id=53, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-11 00:23:02.335840+00:00 +INFO - Started process 225 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'manual__2022-11-11T00:23:02.335840+00:00', '--job-id', '53', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqgchn6lb'] +INFO - Job 53: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-11T00:23:02.335840+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20221111T002302, start_date=20221111T002338, end_date=20221111T002341 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:41.999977Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4665c8a6-c526-428e-9978-583e7df90752"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..a8a27674 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:57.545090Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-11T00:23:02.335840Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d3d824f5-d1c0-4816-90a5-89c7c9b4ef1a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=manual__2022-11-11T00:23:02.335840+00:00, map_index=-1, run_start_date=2022-11-11 00:23:57.545090+00:00, try_number=1, job_id=58, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-11 00:23:02.335840+00:00 +INFO - Started process 223 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'manual__2022-11-11T00:23:02.335840+00:00', '--job-id', '58', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1qitrsvd'] +INFO - Job 58: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-11T00:23:02.335840+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4f9f940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GGwX9JEusonfv8FuP45eyQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GGwX9JEusonfv8FuP45eyQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002358Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002358Z +20221111/us-east-1/s3/aws4_request +820a377e4e3fb5477ee70b7e258be3721504b0c9fdff7c9b3313b8b8ffa5e882 +INFO - '2022-11-11' - botocore.auth - Signature: +5f7b4700f15d239c4c4053c8ee41e6df1c828ca4281d952e004ae367bff5c960 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'VHkCX3LtCe8lauv1twpV9x+5gbjmBCOsX0XnyeOV6VWvSkSBAOqm3okAZRPPtNG6YbrfNahTltI=', 'x-amz-request-id': '6AKBQJPXTRN2EY3M', 'Date': 'Fri, 11 Nov 2022 00:23:59 GMT', 'ETag': '"186c17f4912eb289dfbfc16e3f8e5ec9"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20221111T002302, start_date=20221111T002357, end_date=20221111T002400 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:24:00.201712Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d3d824f5-d1c0-4816-90a5-89c7c9b4ef1a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c7f6cacb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:51.147532Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-11T00:23:02.335840Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f38a2d5-7209-4f96-8784-99c8bcb454ac"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=manual__2022-11-11T00:23:02.335840+00:00, map_index=-1, run_start_date=2022-11-11 00:23:51.147532+00:00, try_number=1, job_id=57, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-11 00:23:02.335840+00:00 +INFO - Started process 234 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'manual__2022-11-11T00:23:02.335840+00:00', '--job-id', '57', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3munxouo'] +INFO - Job 57: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-11T00:23:02.335840+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002352Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002352Z +20221111/us-east-1/s3/aws4_request +9f1e65d340825a28ed2824d4fcd803c9c7898e115432abd1a673d41d2e5815af +INFO - '2022-11-11' - botocore.auth - Signature: +7dc688838dcfeb5bf7f026ea48a9d6af1aa9a5c90225ccb2b4707bdef42a2d36 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'oZ60LAoeRwXXvdQtR22nE9BaTTVWown1STBr/fXrcofawuiPwApFZGX+CfWc9S4glEuu2TN/BJ4=', 'x-amz-request-id': 'N4W1X7PZCS7F0FVW', 'Date': 'Fri, 11 Nov 2022 00:23:52 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20221111T002302, start_date=20221111T002351, end_date=20221111T002353 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:53.705100Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f38a2d5-7209-4f96-8784-99c8bcb454ac"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..1a11b9f2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:46.157586Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-11T00:23:02.335840Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0a3d7d2c-b52f-449e-b432-7543846b884e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=manual__2022-11-11T00:23:02.335840+00:00, map_index=-1, run_start_date=2022-11-11 00:23:46.157586+00:00, try_number=1, job_id=56, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-11 00:23:02.335840+00:00 +INFO - Started process 217 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'manual__2022-11-11T00:23:02.335840+00:00', '--job-id', '56', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7d9m1gk4'] +INFO - Job 56: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-11T00:23:02.335840+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20221111T002302, start_date=20221111T002346, end_date=20221111T002354 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:54.582286Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0a3d7d2c-b52f-449e-b432-7543846b884e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..692c5bfa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=manual__2022-11-11T00\357\200\27223\357\200\27202.335840+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:44.384588Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-11T00:23:02.335840Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ccb7b71a-65a6-35d0-861d-74f33948e7bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58fa7b12-b933-42c3-9471-2ebe54e11fe2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=manual__2022-11-11T00:23:02.335840+00:00, map_index=-1, run_start_date=2022-11-11 00:23:44.384588+00:00, try_number=1, job_id=55, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-11 00:23:02.335840+00:00 +INFO - Started process 214 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'manual__2022-11-11T00:23:02.335840+00:00', '--job-id', '55', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqrkwhcw0'] +INFO - Job 55: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2022-11-11T00:23:02.335840+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20221111T002302, start_date=20221111T002344, end_date=20221111T002347 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=manual__2022-11-11T00:23:02.335840+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:47.779628Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58fa7b12-b933-42c3-9471-2ebe54e11fe2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=ETL/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=ETL/attempt=1.log" new file mode 100644 index 00000000..aae9cb1c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=ETL/attempt=1.log" @@ -0,0 +1,31 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and 
OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T14:46:58.441008Z", "eventType": "START", "inputs": [], "job": {"facets": {"documentation": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DocumentationJobFacet", "description": "this is an ETL dag!"}}, "name": "ETL_dag.ETL", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-01-01T00:00:00+00:00", "task_id": "ETL"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Extract_B1', 'Extract_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", 
"pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-01-01T00:00:00+00:00", "task_group": "", "task_id": "ETL", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-01-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "00655584-8852-33ef-b129-cb17c44600a7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "00655584-8852-33ef-b129-cb17c44600a7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "ETL"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "ETL", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "32e30a8b-cfc3-4847-8d86-a5d836bf067b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=ETL, dagrun_id=scheduled__2018-01-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-10 14:46:58.441008+00:00, try_number=1, job_id=7, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-01-01 00:00:00+00:00 +INFO - Started process 173 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'ETL', 'scheduled__2018-01-01T00:00:00+00:00', '--job-id', '7', '--raw', '--subdir', 'DAGS_FOLDER/dag_factory/factory.py', '--cfg-path', '/tmp/tmp1phh1t9c'] +INFO - Job 7: Subtask ETL +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host b33e9ad29d64 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=ETL +AIRFLOW_CTX_EXECUTION_DATE=2018-01-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-01-01T00:00:00+00:00 +INFO - Init process ETL Alkemy +INFO - Broc95 +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=ETL, execution_date=20180101T000000, start_date=20221110T144658, end_date=20221110T144659 +INFO - {"eventTime": "2022-11-10T14:46:59.669761Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.ETL", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "ETL"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "ETL", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "32e30a8b-cfc3-4847-8d86-a5d836bf067b"}} +INFO - Task exited with return code 0 +INFO - 2 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..04061d41 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,47 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T14:47:03.063537Z", "eventType": "START", "inputs": [], "job": {"facets": {"documentation": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DocumentationJobFacet", "description": "this is an ETL dag!"}}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": 
{"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-01-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-01-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'ETL'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-01-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "00655584-8852-33ef-b129-cb17c44600a7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": 
{"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "00655584-8852-33ef-b129-cb17c44600a7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8a02567-fd68-4da5-86da-239c36e294ff"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-01-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-10 14:47:03.063537+00:00, try_number=1, job_id=9, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-01-01 00:00:00+00:00 +INFO - Started process 182 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-01-01T00:00:00+00:00', '--job-id', '9', '--raw', '--subdir', 'DAGS_FOLDER/dag_factory/factory.py', '--cfg-path', '/tmp/tmpidrwzgye'] +INFO - 
Job 9: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host b33e9ad29d64 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-01-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-01-01T00:00:00+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 52, in extract + conn = hook.get_conn() + File "/usr/local/lib/python3.9/site-packages/airflow/providers/postgres/hooks/postgres.py", line 88, in get_conn + conn = deepcopy(self.connection or self.get_connection(conn_id)) + File "/usr/local/lib/python3.9/site-packages/airflow/hooks/base.py", line 70, in get_connection + conn = Connection.get_connection_from_secrets(conn_id) + File "/usr/local/lib/python3.9/site-packages/airflow/models/connection.py", line 432, in get_connection_from_secrets + raise AirflowNotFoundException(f"The conn_id `{conn_id}` isn't defined") +airflow.exceptions.AirflowNotFoundException: The conn_id `alkemy_db` isn't defined +INFO - Marking task as UP_FOR_RETRY. 
dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180101T000000, start_date=20221110T144703, end_date=20221110T144704 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 9 for task Extract_B1 (The conn_id `alkemy_db` isn't defined; 182) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..1ecc5c8d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-01-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,47 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T14:47:02.999051Z", "eventType": "START", "inputs": [], "job": {"facets": {"documentation": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DocumentationJobFacet", "description": "this is an ETL dag!"}}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-01-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": 
"default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-01-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'ETL'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-01-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "00655584-8852-33ef-b129-cb17c44600a7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "00655584-8852-33ef-b129-cb17c44600a7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, 
"email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4a798c91-d4a6-49eb-8fd5-5bbc2172ab2c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-01-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-10 14:47:02.999051+00:00, try_number=1, job_id=8, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-01-01 00:00:00+00:00 +INFO - Started process 180 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-01-01T00:00:00+00:00', '--job-id', '8', '--raw', '--subdir', 'DAGS_FOLDER/dag_factory/factory.py', '--cfg-path', '/tmp/tmpwbmvul0y'] +INFO - Job 8: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host b33e9ad29d64 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-01-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-01-01T00:00:00+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 52, in extract + conn = hook.get_conn() + File "/usr/local/lib/python3.9/site-packages/airflow/providers/postgres/hooks/postgres.py", line 88, in get_conn + conn = deepcopy(self.connection or self.get_connection(conn_id)) + File "/usr/local/lib/python3.9/site-packages/airflow/hooks/base.py", line 70, in get_connection + conn = Connection.get_connection_from_secrets(conn_id) + File "/usr/local/lib/python3.9/site-packages/airflow/models/connection.py", line 432, in get_connection_from_secrets + raise AirflowNotFoundException(f"The conn_id `{conn_id}` isn't defined") +airflow.exceptions.AirflowNotFoundException: The conn_id `alkemy_db` isn't defined +INFO - Marking task as UP_FOR_RETRY. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180101T000000, start_date=20221110T144702, end_date=20221110T144704 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 8 for task Extract_B2 (The conn_id `alkemy_db` isn't defined; 180) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..1469a9bf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:07.860288Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c250abab-7efe-40d2-837a-042f0d2d84ca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:23:07.860288+00:00, try_number=1, job_id=47, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-01 00:00:00+00:00 +INFO - Started process 195 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-01T00:00:00+00:00', '--job-id', '47', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgv3srzl8'] +INFO - Job 47: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180301T000000, start_date=20221111T002307, end_date=20221111T002312 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:12.951456Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c250abab-7efe-40d2-837a-042f0d2d84ca"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..786b5f64 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:23:07.875522Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6588a0c3-75c2-4d89-910c-1eb01f12d7c0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:23:07.875522+00:00, try_number=1, job_id=48, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-01 00:00:00+00:00 +INFO - Started process 197 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-01T00:00:00+00:00', '--job-id', '48', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps0nl6ns1'] +INFO - Job 48: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180301T000000, start_date=20221111T002307, end_date=20221111T002313 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': 
DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:13.375694Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6588a0c3-75c2-4d89-910c-1eb01f12d7c0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..49ffdbcb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - 
+-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:23:33.203939Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "44dd9f31-9551-4e8a-b5f3-792898220da9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:23:33.203939+00:00, try_number=1, job_id=52, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-01 00:00:00+00:00 +INFO - Started process 217 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-01T00:00:00+00:00', '--job-id', '52', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcu3ki5lk'] +INFO - Job 52: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '7iv/SU4SjszwXDIYo8+25A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:7iv/SU4SjszwXDIYo8+25A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002334Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002334Z +20221111/us-east-1/s3/aws4_request +b6999a8855775907a053ee9d324c919ab4801631360e62a3febad870a6f65f15 +INFO - '2022-11-11' - botocore.auth - Signature: +7d6d0c73fe86e98b02d8d36db5d3d03f075db8d120d52f7411df9f3e7e837c78 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'M4jI+mMP54QmsGqCmfMZ8A5ZFnmc0Pjv9ZlUQAlx0KhXXay/XJGZokedq5TVfxcmFT8QALJb/YQ=', 'x-amz-request-id': 'H9XSTATRBY925BRD', 'Date': 'Fri, 11 Nov 2022 00:23:34 GMT', 'ETag': '"ee2bff494e128eccf05c3218a3cfb6e4"', 'x-amzn-internal-status': '200', 'Content-Length': '0', 'Server': 'AmazonS3'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180301T000000, start_date=20221111T002333, end_date=20221111T002335 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:35.289217Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "44dd9f31-9551-4e8a-b5f3-792898220da9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9bc3274b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:28.084547Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e50dcb0-4788-4f40-81d6-729182ce0f1f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:23:28.084547+00:00, try_number=1, job_id=51, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-01 00:00:00+00:00 +INFO - Started process 210 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-01T00:00:00+00:00', '--job-id', '51', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsmzh5m4x'] +INFO - Job 51: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499513a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002330Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002330Z +20221111/us-east-1/s3/aws4_request +0cb3bb8879e9245cb60d5f9579f6c4272670fc26ca08c127f1ff061cb778c61a +INFO - '2022-11-11' - botocore.auth - Signature: +c6bf149844efe66c9d1590637ad81d3404b3ef70573d635bf240649fdfb9eb18 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'GHVxCtmCXDm4XgIXmMT8vPqZVbnMz0JC5bIV/M+TKR9dAaYrEfF0qK6yQ+skjm0YTcjjOAW5VQc=', 'x-amz-request-id': 'YPJFZ4ERACMNZA8N', 'Date': 'Fri, 11 Nov 2022 00:23:30 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180301T000000, start_date=20221111T002328, end_date=20221111T002331 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:31.597464Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e50dcb0-4788-4f40-81d6-729182ce0f1f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..1059ec34 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:18.234923Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57514422-dce2-44cb-83a4-ef31c067db1f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:23:18.234923+00:00, try_number=1, job_id=49, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-01 00:00:00+00:00 +INFO - Started process 204 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-01T00:00:00+00:00', '--job-id', '49', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj9oxnn0q'] +INFO - Job 49: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180301T000000, start_date=20221111T002318, end_date=20221111T002330 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:30.648405Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57514422-dce2-44cb-83a4-ef31c067db1f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..60ea25ef --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:23:18.666046Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "37d357d1-1e17-3532-b6b6-4dd971685229"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "07e255c7-c100-4af0-8bb1-6fe1f25596b8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:23:18.666046+00:00, try_number=1, job_id=50, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-01 00:00:00+00:00 +INFO - Started process 207 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-01T00:00:00+00:00', '--job-id', '50', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv7bup9m3'] +INFO - Job 50: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180301T000000, start_date=20221111T002318, end_date=20221111T002324 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:23:24.271324Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "07e255c7-c100-4af0-8bb1-6fe1f25596b8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..3979632a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:25:33.988431Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b0449e05-c28f-4ac4-abc2-4c6b61801b2c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:33.988431+00:00, try_number=1, job_id=60, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-02 00:00:00+00:00 +INFO - Started process 320 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-02T00:00:00+00:00', '--job-id', '60', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzdnho_cn'] +INFO - Job 60: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180302T000000, start_date=20221111T002533, end_date=20221111T002536 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:36.528629Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b0449e05-c28f-4ac4-abc2-4c6b61801b2c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bb745799 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:25:33.960236Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7baaf72b-deb8-4594-87b9-9e5e7709fb5c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:33.960236+00:00, try_number=1, job_id=59, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-02 00:00:00+00:00 +INFO - Started process 318 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-02T00:00:00+00:00', '--job-id', '59', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjnas4wxf'] +INFO - Job 59: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180302T000000, start_date=20221111T002533, end_date=20221111T002536 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:36.568018Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7baaf72b-deb8-4594-87b9-9e5e7709fb5c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c31e29f1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:43.411868Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e943dad-0ca9-42c1-b8cc-50630e0b9fe4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:43.411868+00:00, try_number=1, job_id=64, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-02 00:00:00+00:00 +INFO - Started process 342 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-02T00:00:00+00:00', '--job-id', '64', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9wk7h1ua'] +INFO - Job 64: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '6YASFDY8y05PLtumphhjBA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:6YASFDY8y05PLtumphhjBA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002543Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002543Z +20221111/us-east-1/s3/aws4_request +56b2517d26a06352ad30315ddbcc39ca8a3f167febf471c4fa9309e47275870d +INFO - '2022-11-11' - botocore.auth - Signature: +0284640bd181ebd27589d7594fbc62f56b4bce31112b82107b2e2b3d3d23a117 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+cQfKEG8HRCGzTlUlj+I06rEfne1nWSvkpP/J1tvY04zu9GVoYvZWv31CRl63RzKhucD9rgH01k=', 'x-amz-request-id': '1XHR173875RMXDVJ', 'Date': 'Fri, 11 Nov 2022 00:25:44 GMT', 'ETag': '"e9801214363ccb4e4f2edba6a6186304"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180302T000000, start_date=20221111T002543, end_date=20221111T002545 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:45.058444Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e943dad-0ca9-42c1-b8cc-50630e0b9fe4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9d06145f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:42.343355Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0855ac15-aad2-4a15-8cf6-d5a6aff9445e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:42.343355+00:00, try_number=1, job_id=63, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-02 00:00:00+00:00 +INFO - Started process 337 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-02T00:00:00+00:00', '--job-id', '63', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn77quyhk'] +INFO - Job 63: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002543Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002543Z +20221111/us-east-1/s3/aws4_request +7d6ad88a763f84af696864fda1577c5012c1fa2274b9907bb257e30df1f95ad5 +INFO - '2022-11-11' - botocore.auth - Signature: +f35e1233237e5c356599e483ed61fd175128a3b4b50f44e3eb2e5bc5bc044769 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'MvHHKNAqEe0R6zdWz/Oz6SfOG7iPCgRL2RKpYi0SN4ZGohH8Hi/C3cQMWPIgsUALBDdmBVGP+Dk=', 'x-amz-request-id': 'RRS9GA0GP9XY9BV2', 'Date': 'Fri, 11 Nov 2022 00:25:43 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180302T000000, start_date=20221111T002542, end_date=20221111T002544 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:44.376639Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0855ac15-aad2-4a15-8cf6-d5a6aff9445e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ba9145e0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:38.126313Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "68066eb4-19aa-4a59-9f8c-0850401c512c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:38.126313+00:00, try_number=1, job_id=61, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-02 00:00:00+00:00 +INFO - Started process 330 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-02T00:00:00+00:00', '--job-id', '61', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvv6ric8k'] +INFO - Job 61: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180302T000000, start_date=20221111T002538, end_date=20221111T002541 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:41.805069Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "68066eb4-19aa-4a59-9f8c-0850401c512c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..879e0c70 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:38.129656Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7dee6dd-8ec9-3643-be7f-2851981a0b9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8cb306e6-1002-41ad-a769-438dd78534b9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:38.129656+00:00, try_number=1, job_id=62, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-02 00:00:00+00:00 +INFO - Started process 329 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-02T00:00:00+00:00', '--job-id', '62', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnu9f57dd'] +INFO - Job 62: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180302T000000, start_date=20221111T002538, end_date=20221111T002540 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:40.676351Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8cb306e6-1002-41ad-a769-438dd78534b9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7f80ffe0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:25:47.397365Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e750abea-ba67-4a34-b976-f2b1e9133a3e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:47.397365+00:00, try_number=1, job_id=66, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-03 00:00:00+00:00 +INFO - Started process 354 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-03T00:00:00+00:00', '--job-id', '66', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbgj7mu4w'] +INFO - Job 66: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180303T000000, start_date=20221111T002547, end_date=20221111T002550 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:50.068640Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e750abea-ba67-4a34-b976-f2b1e9133a3e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..30f05b8c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:25:47.382656Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4e435cef-b7c0-4c5a-b55d-37846c0948fd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:47.382656+00:00, try_number=1, job_id=65, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-03 00:00:00+00:00 +INFO - Started process 353 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-03T00:00:00+00:00', '--job-id', '65', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8v4z5gql'] +INFO - Job 65: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180303T000000, start_date=20221111T002547, end_date=20221111T002550 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:50.068612Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4e435cef-b7c0-4c5a-b55d-37846c0948fd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..cee4fcb2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:57.620580Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8dbf4d5c-b383-4e34-9c46-3e98532d8b5b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:57.620580+00:00, try_number=1, job_id=70, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-03 00:00:00+00:00 +INFO - Started process 321 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-03T00:00:00+00:00', '--job-id', '70', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkb6un_ra'] +INFO - Job 70: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '+vpcumaw3H10RRLV3CanEw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:+vpcumaw3H10RRLV3CanEw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002558Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002558Z +20221111/us-east-1/s3/aws4_request +27482d400503976a00df832fbea1d3d7098ae7761d98b13d5c060279a4559957 +INFO - '2022-11-11' - botocore.auth - Signature: +b925764cc52218f613f42635d8d8bfed6ea579bd75565b8df84841ef3e88e7e2 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'oQd3IhqVYrpVnBoWu4/9c7Tcugno/R0feYNZUoaJ7lIt9Kg8tIbzdVoe4Qvq5Ldkf/15RZCsLIE=', 'x-amz-request-id': '0PD1FAYSFK9W9Y6G', 'Date': 'Fri, 11 Nov 2022 00:25:58 GMT', 'ETag': '"fafa5cba66b0dc7d744512d5dc26a713"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180303T000000, start_date=20221111T002557, end_date=20221111T002559 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:59.498511Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8dbf4d5c-b383-4e34-9c46-3e98532d8b5b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..392e1da1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:56.269350Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f8feb8b0-6a35-4624-a42f-2f4f08570d77"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:56.269350+00:00, try_number=1, job_id=69, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-03 00:00:00+00:00 +INFO - Started process 315 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-03T00:00:00+00:00', '--job-id', '69', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpu949ubna'] +INFO - Job 69: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002557Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002557Z +20221111/us-east-1/s3/aws4_request +c738114e699783b87714bc29f19a4942fcdd76b9fcb767077f8b3ac5ad975f7a +INFO - '2022-11-11' - botocore.auth - Signature: +f2c6469c41d32139fd9edc0cc5c4a55b281f1352951c1f7460291eb34c44b80e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BHjafCs0E3BsulCqqXsITznOZXZWkADRwQ2WKlMZvqRGsJC4ksSZ6ffnrw9Araxk6Na7Bb3l7no=', 'x-amz-request-id': 'GDFSHX8TJ3J9ZQAB', 'Date': 'Fri, 11 Nov 2022 00:25:57 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180303T000000, start_date=20221111T002556, end_date=20221111T002558 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:58.321652Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f8feb8b0-6a35-4624-a42f-2f4f08570d77"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b103cb08 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:52.299992Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3ed9cf2e-7c14-41b5-8466-f28e6bc55769"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:52.299992+00:00, try_number=1, job_id=67, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-03 00:00:00+00:00 +INFO - Started process 309 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-03T00:00:00+00:00', '--job-id', '67', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5052_2co'] +INFO - Job 67: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180303T000000, start_date=20221111T002552, end_date=20221111T002556 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:56.110321Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3ed9cf2e-7c14-41b5-8466-f28e6bc55769"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..fbd393a2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:25:52.300001Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ad23a99f-e792-3161-b5d5-8e5c13959c2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8f8d768-0dd4-4d69-8cdd-4a7c1e247640"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:25:52.300001+00:00, try_number=1, job_id=68, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-03 00:00:00+00:00 +INFO - Started process 308 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-03T00:00:00+00:00', '--job-id', '68', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd1x9l_0v'] +INFO - Job 68: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180303T000000, start_date=20221111T002552, end_date=20221111T002554 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:25:54.755288Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8f8d768-0dd4-4d69-8cdd-4a7c1e247640"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..08218b84 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:01.570682Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "feb15c8f-c8e7-4215-81dd-f9de9c73a39b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:01.570682+00:00, try_number=1, job_id=71, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-04 00:00:00+00:00 +INFO - Started process 335 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-04T00:00:00+00:00', '--job-id', '71', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3me2z_vq'] +INFO - Job 71: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180304T000000, start_date=20221111T002601, end_date=20221111T002605 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:05.351660Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "feb15c8f-c8e7-4215-81dd-f9de9c73a39b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..cf8e5921 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:01.601840Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "793017f0-7b6e-4743-b043-156b65136d72"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:01.601840+00:00, try_number=1, job_id=72, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-04 00:00:00+00:00 +INFO - Started process 339 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-04T00:00:00+00:00', '--job-id', '72', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph5i3nlnd'] +INFO - Job 72: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180304T000000, start_date=20221111T002601, end_date=20221111T002605 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:05.479060Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "793017f0-7b6e-4743-b043-156b65136d72"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..6eea9f2a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:13.102323Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39c7e593-88d8-4b6a-8c4d-fd2f80f46479"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:13.102323+00:00, try_number=1, job_id=75, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-04 00:00:00+00:00 +INFO - Started process 412 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-04T00:00:00+00:00', '--job-id', '75', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3wiws77q'] +INFO - Job 75: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '+vpcumaw3H10RRLV3CanEw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:+vpcumaw3H10RRLV3CanEw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002613Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002613Z +20221111/us-east-1/s3/aws4_request +89d15d7396b0fa36f2e3f8609c0764c65e213a99f98db7ca7589b2e6dad554a1 +INFO - '2022-11-11' - botocore.auth - Signature: +1a7870151082a7f7bbdeac861622cc665245f8960f5aaef63fb45ea6f72f9e66 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'eaXlE9uzUl7/ho1+qqmp7gG/Qbn4veCmS+6DnqqOyf5O60LKotChqkIVDE7rqfO3/Odi7u662rE=', 'x-amz-request-id': '3QY10A80RYKYX2CF', 'Date': 'Fri, 11 Nov 2022 00:26:14 GMT', 'ETag': '"fafa5cba66b0dc7d744512d5dc26a713"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180304T000000, start_date=20221111T002613, end_date=20221111T002615 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:15.369369Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39c7e593-88d8-4b6a-8c4d-fd2f80f46479"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b88b89f2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:13.121746Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e88f34e-41ca-42ab-b9d6-5142bc65c359"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:13.121746+00:00, try_number=1, job_id=76, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-04 00:00:00+00:00 +INFO - Started process 413 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-04T00:00:00+00:00', '--job-id', '76', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxt1adnqt'] +INFO - Job 76: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002614Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002614Z +20221111/us-east-1/s3/aws4_request +a07beb2d7f4249274c7e30438bc20534c1f50b056195adef2af89503740e5d0d +INFO - '2022-11-11' - botocore.auth - Signature: +7fb4f9b7f5f1b60e8c16ef0a13d7c7ffd53e0c36e598e4fee89644f4695ea48b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Q11kAEqFz86dXAmY4ngC5Em8JD472J6KM/QNcMiPq5XGll49cPh9VUvcjFCP9Vp8NM115NORWIQ=', 'x-amz-request-id': '3QYC9S3AZJJFW9H2', 'Date': 'Fri, 11 Nov 2022 00:26:14 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180304T000000, start_date=20221111T002613, end_date=20221111T002615 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:15.167177Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e88f34e-41ca-42ab-b9d6-5142bc65c359"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..739b2c69 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:07.797779Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73d3383d-6154-4868-94a0-458c45fcdee8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:07.797779+00:00, try_number=1, job_id=73, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-04 00:00:00+00:00 +INFO - Started process 425 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-04T00:00:00+00:00', '--job-id', '73', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqz3xow5f'] +INFO - Job 73: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180304T000000, start_date=20221111T002607, end_date=20221111T002611 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:11.557283Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73d3383d-6154-4868-94a0-458c45fcdee8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..08b1f3aa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:07.987021Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6c9cc011-a398-3005-bd1e-624cdb243f21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0857904a-4575-46ee-8116-b3defdd1d3f5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:07.987021+00:00, try_number=1, job_id=74, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-04 00:00:00+00:00 +INFO - Started process 404 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-04T00:00:00+00:00', '--job-id', '74', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx5pskmau'] +INFO - Job 74: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180304T000000, start_date=20221111T002607, end_date=20221111T002611 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:11.085156Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0857904a-4575-46ee-8116-b3defdd1d3f5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c3050edf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:17.181130Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9140f80-e1b6-44e9-93e0-5fb7b03677a3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:17.181130+00:00, try_number=1, job_id=78, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-05 00:00:00+00:00 +INFO - Started process 434 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-05T00:00:00+00:00', '--job-id', '78', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprtotyjv0'] +INFO - Job 78: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180305T000000, start_date=20221111T002617, end_date=20221111T002620 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:20.319113Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9140f80-e1b6-44e9-93e0-5fb7b03677a3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c0863090 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:17.179612Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "98d797e4-edf9-4488-a59c-f7651f104d73"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:17.179612+00:00, try_number=1, job_id=77, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-05 00:00:00+00:00 +INFO - Started process 431 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-05T00:00:00+00:00', '--job-id', '77', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuih1s_cn'] +INFO - Job 77: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180305T000000, start_date=20221111T002617, end_date=20221111T002620 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:20.912793Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "98d797e4-edf9-4488-a59c-f7651f104d73"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bc86d418 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:28.027586Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6c9ebd10-b4c7-4892-b8e1-b99e0b4c96b2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:28.027586+00:00, try_number=1, job_id=81, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-05 00:00:00+00:00 +INFO - Started process 447 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-05T00:00:00+00:00', '--job-id', '81', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphmv3r2md'] +INFO - Job 81: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'fqKwtgAi/madeXOrWfGZ0w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:fqKwtgAi/madeXOrWfGZ0w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002628Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002628Z +20221111/us-east-1/s3/aws4_request +94b7561f3e8888933e6c23b46c25053d7a7d4b122065c92b51a85c703c327345 +INFO - '2022-11-11' - botocore.auth - Signature: +43e1a301fbf432ef2ed700d32ece19adbfcfc712f4557c6b41f52635dcc3e3a5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '96Y5VH3HzPs906Wo/5dWjxIjJ8aP+Kd52tJ5X2qWUNjAu/ytpfe0p81MLTUZpplVP/UiJ9YLEYE=', 'x-amz-request-id': '63VJ9QCXCGWD7V83', 'Date': 'Fri, 11 Nov 2022 00:26:29 GMT', 'ETag': '"7ea2b0b60022fe669d7973ab59f199d3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180305T000000, start_date=20221111T002628, end_date=20221111T002629 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:29.712486Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6c9ebd10-b4c7-4892-b8e1-b99e0b4c96b2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..87bf584e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:28.027523Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb78e648-b411-448d-8e69-fef9a473c996"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:28.027523+00:00, try_number=1, job_id=82, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-05 00:00:00+00:00 +INFO - Started process 449 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-05T00:00:00+00:00', '--job-id', '82', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpk4aiudvo'] +INFO - Job 82: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002628Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002628Z +20221111/us-east-1/s3/aws4_request +68317afd45756fb1145faf833997f8d320bb5ec11492456d3fa55534874a1d93 +INFO - '2022-11-11' - botocore.auth - Signature: +a52a07b9c96917f8a5df5d0324d4127227f9d6f8b933e5372a3fe469f4ca574f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'RoxH/X03qOABAvwc30IIwepqbWnMaMeIBKh1kyDScw4NY4u54YI/4+WFlspjAhN1heChNCodYKI=', 'x-amz-request-id': '63VMKE53VW7CGCR5', 'Date': 'Fri, 11 Nov 2022 00:26:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180305T000000, start_date=20221111T002628, end_date=20221111T002629 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:29.774617Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb78e648-b411-448d-8e69-fef9a473c996"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..658522c1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:22.066879Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0f1277a6-434c-45ee-bd46-cd12724f8742"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:22.066879+00:00, try_number=1, job_id=79, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-05 00:00:00+00:00 +INFO - Started process 423 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-05T00:00:00+00:00', '--job-id', '79', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpeogzuzdy'] +INFO - Job 79: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180305T000000, start_date=20221111T002622, end_date=20221111T002626 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:26.793472Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0f1277a6-434c-45ee-bd46-cd12724f8742"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f84c38e5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:23.443630Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2391e80b-70cc-334d-8fe4-031900bb357a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a1cce4eb-56eb-48a9-9282-daa90a4c34ab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:23.443630+00:00, try_number=1, job_id=80, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-05 00:00:00+00:00 +INFO - Started process 440 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-05T00:00:00+00:00', '--job-id', '80', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfzt_mhgr'] +INFO - Job 80: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180305T000000, start_date=20221111T002623, end_date=20221111T002626 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:26.701823Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a1cce4eb-56eb-48a9-9282-daa90a4c34ab"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b509c4e2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:32.277045Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "08815ed1-a359-4b24-b962-10ed5cfcf460"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:32.277045+00:00, try_number=1, job_id=83, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-06 00:00:00+00:00 +INFO - Started process 466 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-06T00:00:00+00:00', '--job-id', '83', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpboo2dn4y'] +INFO - Job 83: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180306T000000, start_date=20221111T002632, end_date=20221111T002634 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:34.915234Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "08815ed1-a359-4b24-b962-10ed5cfcf460"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7f3a8468 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:32.312173Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd8750fc-80e4-4279-9440-dc289d8f32f9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:32.312173+00:00, try_number=1, job_id=84, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-06 00:00:00+00:00 +INFO - Started process 468 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-06T00:00:00+00:00', '--job-id', '84', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgbm00aw2'] +INFO - Job 84: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180306T000000, start_date=20221111T002632, end_date=20221111T002634 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:34.926043Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd8750fc-80e4-4279-9440-dc289d8f32f9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..991b150d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:42.305567Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8ca0804a-4c1d-4520-861e-6e6f4eb42111"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:42.305567+00:00, try_number=1, job_id=88, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-06 00:00:00+00:00 +INFO - Started process 499 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-06T00:00:00+00:00', '--job-id', '88', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpto1z8tke'] +INFO - Job 88: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'E0P3oTu9aOkptHvsAXWh+g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:E0P3oTu9aOkptHvsAXWh+g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002642Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002642Z +20221111/us-east-1/s3/aws4_request +a166bb4819378f7229a9c7b266e5932dd80a7273745ef0d2c1799f65824415e0 +INFO - '2022-11-11' - botocore.auth - Signature: +14a05124e0bc603e53cbf921d109ced17bc26c75436acec9f9f617ef5ed73c31 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'zl6zqj+lPOTllccrv3yI3YU9oqFeZJhBXAPYXB/mbTS285/5J9R40sbnVjBfs7L1msSR9pV9IuM6UK92s1OwuA==', 'x-amz-request-id': '04GGNSKJPGAWVTMC', 'Date': 'Fri, 11 Nov 2022 00:26:43 GMT', 'ETag': '"1343f7a13bbd68e929b47bec0175a1fa"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180306T000000, start_date=20221111T002642, end_date=20221111T002644 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:44.067672Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8ca0804a-4c1d-4520-861e-6e6f4eb42111"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..601f894b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:41.607774Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "447ec19a-d490-4392-821b-0e1b85440e58"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:41.607774+00:00, try_number=1, job_id=87, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-06 00:00:00+00:00 +INFO - Started process 494 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-06T00:00:00+00:00', '--job-id', '87', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpukc58q56'] +INFO - Job 87: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002642Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002642Z +20221111/us-east-1/s3/aws4_request +a08fa15750cc5c2c83f4e06cdd21dc7a573a3fc97a1903f5152eaf3b87414b8f +INFO - '2022-11-11' - botocore.auth - Signature: +9327a31979c84ba3b194c7e2875a19367e1eff79d0e8cb5bc1d069d0cc3166b8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+JFWszhvBgxSCxM033sxtj7VrcEuvJ4Oks1rS9ZQ+H7nGjZ45rJm8yXIL3+/1M7/1kM2anRz8EEn9D9QU3Sbwg==', 'x-amz-request-id': '04GM7SHA9QZB9M41', 'Date': 'Fri, 11 Nov 2022 00:26:43 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180306T000000, start_date=20221111T002641, end_date=20221111T002643 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:43.851060Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "447ec19a-d490-4392-821b-0e1b85440e58"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..075474da --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:36.834842Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5de92dc-1a3d-4a43-b591-59e16597beff"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:36.834842+00:00, try_number=1, job_id=85, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-06 00:00:00+00:00 +INFO - Started process 533 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-06T00:00:00+00:00', '--job-id', '85', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdjc7fvfb'] +INFO - Job 85: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180306T000000, start_date=20221111T002636, end_date=20221111T002640 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:40.582487Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5de92dc-1a3d-4a43-b591-59e16597beff"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..76bbee36 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:36.867910Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6cb6b049-1d02-3f54-aa21-7317207a1921"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ede0410-cd71-4ba7-a01a-1b792f0e4d36"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:36.867910+00:00, try_number=1, job_id=86, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-06 00:00:00+00:00 +INFO - Started process 534 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-06T00:00:00+00:00', '--job-id', '86', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_iutgt7o'] +INFO - Job 86: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180306T000000, start_date=20221111T002636, end_date=20221111T002640 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:40.075155Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ede0410-cd71-4ba7-a01a-1b792f0e4d36"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c9df6fdb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:46.064128Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f741e974-0402-4334-9304-a38947341bda"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:46.064128+00:00, try_number=1, job_id=90, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-07 00:00:00+00:00 +INFO - Started process 511 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-07T00:00:00+00:00', '--job-id', '90', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnrviv9oi'] +INFO - Job 90: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180307T000000, start_date=20221111T002646, end_date=20221111T002648 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:48.942133Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f741e974-0402-4334-9304-a38947341bda"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..1a1712fb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:46.003254Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c46a3b7-8f98-407f-a14a-320c716c6e26"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:46.003254+00:00, try_number=1, job_id=89, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-07 00:00:00+00:00 +INFO - Started process 509 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-07T00:00:00+00:00', '--job-id', '89', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1y6w8l68'] +INFO - Job 89: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180307T000000, start_date=20221111T002646, end_date=20221111T002648 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:48.943951Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c46a3b7-8f98-407f-a14a-320c716c6e26"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5edaec17 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:54.553065Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b4d0856d-e4bd-4f22-8cc1-8c845ee1ceb4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:54.553065+00:00, try_number=1, job_id=94, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-07 00:00:00+00:00 +INFO - Started process 531 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-07T00:00:00+00:00', '--job-id', '94', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp57xwnerz'] +INFO - Job 94: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'lM/+rM/sQJE9XhGrSFJ+sw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:lM/+rM/sQJE9XhGrSFJ+sw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002655Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002655Z +20221111/us-east-1/s3/aws4_request +9388273538fdf9d63deb3c86bc79fbec0550142d0ec4f3bcd7eb0c8614688b2e +INFO - '2022-11-11' - botocore.auth - Signature: +c6f0b56a97f4ffa38a8d7e9c9e8ad17928020b365a0bcec68e09e0d67b45c665 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'u+15aboXSEZbtWKYGFpy5CLghDQ9KjDH7woomnGmLJlmzOSu/ntWaoAVfD3w4moUqzf4MOjPzBI=', 'x-amz-request-id': 'JJW306TM4TT13XFV', 'Date': 'Fri, 11 Nov 2022 00:26:55 GMT', 'ETag': '"94cffeaccfec40913d5e11ab48527eb3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180307T000000, start_date=20221111T002654, end_date=20221111T002657 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:57.048718Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b4d0856d-e4bd-4f22-8cc1-8c845ee1ceb4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..3d9a594d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:54.492412Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "56d7ae98-4519-48eb-ae10-7223fe9364d0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:54.492412+00:00, try_number=1, job_id=93, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-07 00:00:00+00:00 +INFO - Started process 529 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-07T00:00:00+00:00', '--job-id', '93', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptv77ls5i'] +INFO - Job 93: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002655Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002655Z +20221111/us-east-1/s3/aws4_request +148f914fd4f34960fe5f9c13ca916b68c2b3dff63ca5a2926e66fc620b7ec1cd +INFO - '2022-11-11' - botocore.auth - Signature: +03a378e25d7de0ce0cc4db799f9cb9210af4ab91b6fe9c0a466b20459d3f37d9 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'WphfqRpWz8HYqZoFutPboal6sjPr9YmHr1+88Wb4bCWUXOFuZDPaIgTgjBj3hP1r7Bspy35u5hI=', 'x-amz-request-id': 'JJWCN6M4565FYS1B', 'Date': 'Fri, 11 Nov 2022 00:26:55 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180307T000000, start_date=20221111T002654, end_date=20221111T002656 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:56.778936Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "56d7ae98-4519-48eb-ae10-7223fe9364d0"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ba0f1ca9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:50.243772Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d7f7095-38e1-435f-abb3-5f7fc7e51d55"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:50.243772+00:00, try_number=1, job_id=91, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-07 00:00:00+00:00 +INFO - Started process 520 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-07T00:00:00+00:00', '--job-id', '91', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfgdrr8ul'] +INFO - Job 91: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180307T000000, start_date=20221111T002650, end_date=20221111T002653 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:53.251935Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d7f7095-38e1-435f-abb3-5f7fc7e51d55"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f4c13b28 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:26:50.246617Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "84565895-73ab-364d-a00b-d6cba3900730"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c2be86aa-1042-4339-854d-0174bb98a52a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:50.246617+00:00, try_number=1, job_id=92, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-07 00:00:00+00:00 +INFO - Started process 521 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-07T00:00:00+00:00', '--job-id', '92', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpixgkepp_'] +INFO - Job 92: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180307T000000, start_date=20221111T002650, end_date=20221111T002653 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:26:53.132576Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c2be86aa-1042-4339-854d-0174bb98a52a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..4f89b160 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:58.827245Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c03287b3-a9f3-442c-b136-58f807cd07a3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:58.827245+00:00, try_number=1, job_id=95, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-08 00:00:00+00:00 +INFO - Started process 545 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-08T00:00:00+00:00', '--job-id', '95', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp07745c43'] +INFO - Job 95: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180308T000000, start_date=20221111T002658, end_date=20221111T002702 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:02.145326Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c03287b3-a9f3-442c-b136-58f807cd07a3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d43e52cc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:26:58.838684Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "21b8fe71-65d4-4e9a-9915-25e2f2844d8d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:26:58.838684+00:00, try_number=1, job_id=96, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-08 00:00:00+00:00 +INFO - Started process 543 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-08T00:00:00+00:00', '--job-id', '96', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1y13j7v7'] +INFO - Job 96: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180308T000000, start_date=20221111T002658, end_date=20221111T002702 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:02.137348Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "21b8fe71-65d4-4e9a-9915-25e2f2844d8d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..30513483 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:12.288118Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb21129f-0ec8-4ee2-aa31-7eeb1e156229"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:12.288118+00:00, try_number=1, job_id=100, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-08 00:00:00+00:00 +INFO - Started process 616 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-08T00:00:00+00:00', '--job-id', '100', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4xz0i1f3'] +INFO - Job 100: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'lM/+rM/sQJE9XhGrSFJ+sw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:lM/+rM/sQJE9XhGrSFJ+sw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002712Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002712Z +20221111/us-east-1/s3/aws4_request +44aec1c929e04b1e380f8d34f0a7da9c14562da87262e1d8a735b12fbdcafc7c +INFO - '2022-11-11' - botocore.auth - Signature: +dbad746151818b372449703a1898d0f61be012d712f5cc57dc2cb8a442a50770 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NrsAzS6ZA1ubqwzyXLg1KnqyYkZaUhDp3ByIRJGvBLS+EqPJvG3W3W/irPl2FDaMap+sG/aNh94=', 'x-amz-request-id': '0W1CGZXE0Y299HDS', 'Date': 'Fri, 11 Nov 2022 00:27:13 GMT', 'ETag': '"94cffeaccfec40913d5e11ab48527eb3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180308T000000, start_date=20221111T002712, end_date=20221111T002713 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:13.707376Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb21129f-0ec8-4ee2-aa31-7eeb1e156229"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..62b9a2a8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:08.874361Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99a21432-4cf1-4f71-8b45-a0dd38746f2b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:08.874361+00:00, try_number=1, job_id=99, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-08 00:00:00+00:00 +INFO - Started process 618 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-08T00:00:00+00:00', '--job-id', '99', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqjovxhfi'] +INFO - Job 99: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002709Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002709Z +20221111/us-east-1/s3/aws4_request +90e3e5afb65327ad9bda18ab1ffa832bd931354d2f89cb16dd8ddcb13ac24a0c +INFO - '2022-11-11' - botocore.auth - Signature: +c00f57003f80145d0f5c087c153b01e656ee60456f34fb620170b64798377094 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'fLiW2W2Bcuoc0QhbaLMa1Ps7FsngGE2FZCQfm2Agi/PJcTmAua2th9QjkVP9vST3tR2FHoexOZI=', 'x-amz-request-id': '6H1DTH314TX3FB3C', 'Date': 'Fri, 11 Nov 2022 00:27:10 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180308T000000, start_date=20221111T002708, end_date=20221111T002711 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:11.419420Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99a21432-4cf1-4f71-8b45-a0dd38746f2b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..9a2609e3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:03.776511Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb524089-5d2c-46cb-a72f-1473e0713996"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:03.776511+00:00, try_number=1, job_id=97, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-08 00:00:00+00:00 +INFO - Started process 553 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-08T00:00:00+00:00', '--job-id', '97', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvcrrtq5l'] +INFO - Job 97: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180308T000000, start_date=20221111T002703, end_date=20221111T002710 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:10.112844Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb524089-5d2c-46cb-a72f-1473e0713996"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e83128da --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:03.784173Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "4f2d94bc-ddc0-3a3a-af56-22625f5f12a5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6438e468-2eee-43b1-9ae0-797502ec6992"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:03.784173+00:00, try_number=1, job_id=98, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-08 00:00:00+00:00 +INFO - Started process 551 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-08T00:00:00+00:00', '--job-id', '98', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppkhytji0'] +INFO - Job 98: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180308T000000, start_date=20221111T002703, end_date=20221111T002706 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:06.599478Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6438e468-2eee-43b1-9ae0-797502ec6992"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6d5c5b5e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:27:15.920038Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1d272432-d223-4dec-b2fb-713023b9da82"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:15.920038+00:00, try_number=1, job_id=101, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-09 00:00:00+00:00 +INFO - Started process 626 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-09T00:00:00+00:00', '--job-id', '101', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpblzndwt7'] +INFO - Job 101: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180309T000000, start_date=20221111T002715, end_date=20221111T002719 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:19.136771Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1d272432-d223-4dec-b2fb-713023b9da82"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..95464c9b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:27:15.923711Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eefd059f-1c0e-491c-a99e-390f340e029c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:15.923711+00:00, try_number=1, job_id=102, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-09 00:00:00+00:00 +INFO - Started process 627 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-09T00:00:00+00:00', '--job-id', '102', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe7qv2kdv'] +INFO - Job 102: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180309T000000, start_date=20221111T002715, end_date=20221111T002719 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:19.149503Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eefd059f-1c0e-491c-a99e-390f340e029c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1f310ab1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:26.001071Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ccb3e872-0cdf-45d9-9324-8427b68ce551"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:26.001071+00:00, try_number=1, job_id=106, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-09 00:00:00+00:00 +INFO - Started process 630 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-09T00:00:00+00:00', '--job-id', '106', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprfg7vn76'] +INFO - Job 106: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '1hjxOzPvK9TPxXAnIfsqBw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:1hjxOzPvK9TPxXAnIfsqBw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002726Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002726Z +20221111/us-east-1/s3/aws4_request +8da246c9936f895b95c419bb22aaed8ab9cd7ff8b4f0fe52bfcd75de56a65abb +INFO - '2022-11-11' - botocore.auth - Signature: +802e63567207d24f9bf433b88debea0335e154b1d530391b4a4842e16cf81dbc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'rtHV+KavsiQaI/6c9gj9jGUvbBoEbkFMVFv/8ba73WLzw9bkSV6uym11A+TQ7FRjyvpfyge6NwI=', 'x-amz-request-id': 'B7GRZP3KWENA0JKB', 'Date': 'Fri, 11 Nov 2022 00:27:27 GMT', 'ETag': '"d618f13b33ef2bd4cfc5702721fb2a07"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180309T000000, start_date=20221111T002726, end_date=20221111T002727 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:27.800615Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ccb3e872-0cdf-45d9-9324-8427b68ce551"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9d60afac --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:25.937675Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "53cf1609-97cb-4b3a-b4bf-3868d76bc580"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:25.937675+00:00, try_number=1, job_id=105, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-09 00:00:00+00:00 +INFO - Started process 628 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-09T00:00:00+00:00', '--job-id', '105', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxu8lillb'] +INFO - Job 105: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002726Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002726Z +20221111/us-east-1/s3/aws4_request +5b4eb7d6a46bbc3c44f1f580951ff01c4f5123041c565cbe59655389a71fab54 +INFO - '2022-11-11' - botocore.auth - Signature: +4f521bb6213f0547181f12908d44471503363728bb099b5984f979209eff7083 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6spy3Gl7ViB9FD5l6UCVdIbcMrjbzVCnpBCzX5buKvLLOQW7YEyksdWE9r9REJxIBsJmMsKxdfE=', 'x-amz-request-id': 'B7GYN10ZAE2S78BN', 'Date': 'Fri, 11 Nov 2022 00:27:27 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180309T000000, start_date=20221111T002725, end_date=20221111T002727 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:27.653538Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "53cf1609-97cb-4b3a-b4bf-3868d76bc580"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..780f900a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:21.361930Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0ce263e3-0419-44a6-a56a-b2637d87e3bd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:21.361930+00:00, try_number=1, job_id=103, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-09 00:00:00+00:00 +INFO - Started process 634 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-09T00:00:00+00:00', '--job-id', '103', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzq7hs707'] +INFO - Job 103: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180309T000000, start_date=20221111T002721, end_date=20221111T002724 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:24.595067Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0ce263e3-0419-44a6-a56a-b2637d87e3bd"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e8aa38f0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:21.390465Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f9a06ff-8dfd-3fdd-ae8d-3e4be08f43f6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c1ad13c-8118-43b8-a669-96fbda4039a8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:21.390465+00:00, try_number=1, job_id=104, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-09 00:00:00+00:00 +INFO - Started process 637 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-09T00:00:00+00:00', '--job-id', '104', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptgtjm393'] +INFO - Job 104: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180309T000000, start_date=20221111T002721, end_date=20221111T002724 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:24.455212Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c1ad13c-8118-43b8-a669-96fbda4039a8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c78b2a73 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:27:29.479761Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dca6aa3c-d0b6-4c18-8d33-991893b2014f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:29.479761+00:00, try_number=1, job_id=108, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-10 00:00:00+00:00 +INFO - Started process 647 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-10T00:00:00+00:00', '--job-id', '108', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx2pbuef0'] +INFO - Job 108: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180310T000000, start_date=20221111T002729, end_date=20221111T002732 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:32.687915Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dca6aa3c-d0b6-4c18-8d33-991893b2014f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7078bb57 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:27:29.476297Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb2cfc2d-c587-4f2a-a75e-30df262f8cb6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:29.476297+00:00, try_number=1, job_id=107, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-10 00:00:00+00:00 +INFO - Started process 646 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-10T00:00:00+00:00', '--job-id', '107', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo25530zr'] +INFO - Job 107: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180310T000000, start_date=20221111T002729, end_date=20221111T002732 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:32.771791Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb2cfc2d-c587-4f2a-a75e-30df262f8cb6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..51270caa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:44.185081Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f7045ec2-577f-480b-8a41-d294ac1e3d19"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:44.185081+00:00, try_number=1, job_id=112, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-10 00:00:00+00:00 +INFO - Started process 725 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-10T00:00:00+00:00', '--job-id', '112', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp774m7wcn'] +INFO - Job 112: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'pcPdNjaW/JlYHdJqdJNWpQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:pcPdNjaW/JlYHdJqdJNWpQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002744Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002744Z +20221111/us-east-1/s3/aws4_request +61f3d54f0ada8b6f0ac93d1fbb84a70e2a6b1d57db11b2554eea66626b519aa2 +INFO - '2022-11-11' - botocore.auth - Signature: +3ac6f7ab6fe837a496cb3bc080c20e7cb639cc5d6b47dc59fbcc947c43eaa043 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '3F84Dtwq/IQWYKqL/OAV0nVSnh2mVz3tEiMkVL3jpb8vfWNZMKvoYoBbhR8ir2neeaTmjlEBfkc=', 'x-amz-request-id': 'VWE1WEDTE0JH8P92', 'Date': 'Fri, 11 Nov 2022 00:27:45 GMT', 'ETag': '"a5c3dd363696fc99581dd26a749356a5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180310T000000, start_date=20221111T002744, end_date=20221111T002746 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:46.276287Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f7045ec2-577f-480b-8a41-d294ac1e3d19"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4d14657e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:40.808863Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "376ea933-921d-4b87-8495-fc9f81085a17"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:40.808863+00:00, try_number=1, job_id=111, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-10 00:00:00+00:00 +INFO - Started process 718 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-10T00:00:00+00:00', '--job-id', '111', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2ls2niku'] +INFO - Job 111: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50063a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002741Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002741Z +20221111/us-east-1/s3/aws4_request +3e2bd5964fad1f8dc266d5ea93dd398b2988ac3ada443f1bb180dfe3b1fa65b8 +INFO - '2022-11-11' - botocore.auth - Signature: +81a503fe09933b7e38b86cabc0c4e45d2af559656ee1dcec22a7ad62367487b2 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+ZMcQqArf/N4HFhaX0LCcLyTNefkXDc1H2sRAiKvM6MoeEIri3RYstuVO9W/D0E6pVsLJVlt+UMw4KuBKBgctg==', 'x-amz-request-id': 'ZW9P87A62RXMKMP7', 'Date': 'Fri, 11 Nov 2022 00:27:42 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180310T000000, start_date=20221111T002740, end_date=20221111T002743 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:43.281905Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "376ea933-921d-4b87-8495-fc9f81085a17"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a75b0373 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:35.496655Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36cc1599-48b2-4ca5-8be3-4f5f701dde9c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:35.496655+00:00, try_number=1, job_id=109, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-10 00:00:00+00:00 +INFO - Started process 661 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-10T00:00:00+00:00', '--job-id', '109', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn5sjy4lq'] +INFO - Job 109: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180310T000000, start_date=20221111T002735, end_date=20221111T002742 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:42.022261Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36cc1599-48b2-4ca5-8be3-4f5f701dde9c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..c563e21a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:35.584440Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "46140dd3-f6a6-3300-b827-0c5f58912347"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5c796d51-3d3c-4a13-8bc2-5067353ae2ea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:35.584440+00:00, try_number=1, job_id=110, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-10 00:00:00+00:00 +INFO - Started process 664 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-10T00:00:00+00:00', '--job-id', '110', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvqwv243x'] +INFO - Job 110: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180310T000000, start_date=20221111T002735, end_date=20221111T002739 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:39.128679Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5c796d51-3d3c-4a13-8bc2-5067353ae2ea"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..a019956c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:27:49.329736Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58826736-3a3d-4955-8898-33be1201a9d2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:49.329736+00:00, try_number=1, job_id=113, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-11 00:00:00+00:00 +INFO - Started process 736 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-11T00:00:00+00:00', '--job-id', '113', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps2w3k7gd'] +INFO - Job 113: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180311T000000, start_date=20221111T002749, end_date=20221111T002752 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:52.376695Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58826736-3a3d-4955-8898-33be1201a9d2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c95c9c54 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:27:49.329019Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9e32b84a-8dd6-4c59-a931-b502b3e086c1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:49.329019+00:00, try_number=1, job_id=114, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-11 00:00:00+00:00 +INFO - Started process 735 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-11T00:00:00+00:00', '--job-id', '114', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7w4rkp_h'] +INFO - Job 114: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180311T000000, start_date=20221111T002749, end_date=20221111T002752 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:52.300593Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9e32b84a-8dd6-4c59-a931-b502b3e086c1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..a1028c28 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:58.783310Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a208c8bf-8e54-4cd2-bfff-0144887066c4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:58.783310+00:00, try_number=1, job_id=118, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-11 00:00:00+00:00 +INFO - Started process 756 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-11T00:00:00+00:00', '--job-id', '118', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpehrkl2b8'] +INFO - Job 118: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MllJ9/evZUgKOAi4Bq6JJQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MllJ9/evZUgKOAi4Bq6JJQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002759Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002759Z +20221111/us-east-1/s3/aws4_request +967a8aefc637faac04f05cb899ed66d468fe66251b7f4af18b33b8ab51718375 +INFO - '2022-11-11' - botocore.auth - Signature: +0d13a0feb1a271d8b2210a6de15cc07fa9e896494306606b7e366b7b2cfae7a1 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'PKNPlOlshjZ13iwm7uzuS4wko/VC4VeJBiKGdYsOnypi6mti8PpkNPi7BmXq0CCF7ctUJpT09kM=', 'x-amz-request-id': 'Q4N7PB73TZC8GRZQ', 'Date': 'Fri, 11 Nov 2022 00:28:00 GMT', 'ETag': '"325949f7f7af65480a3808b806ae8925"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180311T000000, start_date=20221111T002758, end_date=20221111T002801 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:01.469592Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a208c8bf-8e54-4cd2-bfff-0144887066c4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..436f9c73 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:58.669823Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b258f360-2d9a-4500-8eff-951f33044df4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:58.669823+00:00, try_number=1, job_id=117, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-11 00:00:00+00:00 +INFO - Started process 753 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-11T00:00:00+00:00', '--job-id', '117', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9jcchknc'] +INFO - Job 117: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002759Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002759Z +20221111/us-east-1/s3/aws4_request +3f71156e1b69364783243d46388c1ae0395914da187ddc66538eea6c650114ea +INFO - '2022-11-11' - botocore.auth - Signature: +ef9a790a2fb00d54a3e4b011cffb8eea9023b977d33573b6c42f3720f8528064 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'HnbGBqxKjQrh0GeKQV+WMDOo2bXvaGJXdrjONaDvgSrRsQLD1jAu+ODUvJRQb0VcyhIouhkF5o0=', 'x-amz-request-id': 'Q4N0B763J9HXR2YN', 'Date': 'Fri, 11 Nov 2022 00:28:00 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180311T000000, start_date=20221111T002758, end_date=20221111T002801 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:01.361043Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b258f360-2d9a-4500-8eff-951f33044df4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..dd1eb6f3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:53.845080Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c6729375-1834-46ab-bc9a-8e9b63db1d98"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:53.845080+00:00, try_number=1, job_id=115, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-11 00:00:00+00:00 +INFO - Started process 745 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-11T00:00:00+00:00', '--job-id', '115', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp589n3q9r'] +INFO - Job 115: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180311T000000, start_date=20221111T002753, end_date=20221111T002757 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:57.349963Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c6729375-1834-46ab-bc9a-8e9b63db1d98"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..bf86d2a9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:27:53.870263Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0f4026a1-e7a9-361a-8cce-df0f908336bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2fe31c1b-7a15-4036-b646-d168fa84f7ff"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:27:53.870263+00:00, try_number=1, job_id=116, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-11 00:00:00+00:00 +INFO - Started process 746 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-11T00:00:00+00:00', '--job-id', '116', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdo55ke_y'] +INFO - Job 116: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180311T000000, start_date=20221111T002753, end_date=20221111T002756 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:27:56.938680Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2fe31c1b-7a15-4036-b646-d168fa84f7ff"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6bd8034d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:03.233230Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cb86b5b-fd22-415c-8348-2665d44c12f4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:03.233230+00:00, try_number=1, job_id=119, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-12 00:00:00+00:00 +INFO - Started process 719 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-12T00:00:00+00:00', '--job-id', '119', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl5zc2aqq'] +INFO - Job 119: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180312T000000, start_date=20221111T002803, end_date=20221111T002806 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:06.666722Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cb86b5b-fd22-415c-8348-2665d44c12f4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b46b2ec5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:03.234782Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cbbb6834-f9c8-4cd6-82a4-dc4709424719"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:03.234782+00:00, try_number=1, job_id=120, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-12 00:00:00+00:00 +INFO - Started process 718 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-12T00:00:00+00:00', '--job-id', '120', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2mzo5pj8'] +INFO - Job 120: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180312T000000, start_date=20221111T002803, end_date=20221111T002806 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:06.693281Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cbbb6834-f9c8-4cd6-82a4-dc4709424719"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..2a580307 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:15.286003Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0dcd956c-0cc6-4f58-b98d-7dcfbc5d3b7d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:15.286003+00:00, try_number=1, job_id=124, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-12 00:00:00+00:00 +INFO - Started process 831 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-12T00:00:00+00:00', '--job-id', '124', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy_1g7nuu'] +INFO - Job 124: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MllJ9/evZUgKOAi4Bq6JJQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MllJ9/evZUgKOAi4Bq6JJQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002816Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002816Z +20221111/us-east-1/s3/aws4_request +69a9a798bced6ccd1233de4f47e90b340d22e4708b52cc5b6d1d8131427e8fc2 +INFO - '2022-11-11' - botocore.auth - Signature: +af566f40b7804fb31749a9f7d46bf1f1c4b611c9073b3c62e8c02d153d051306 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'KK2n3Qo+khP1vzcH4GK0md2rIhwC5RgtoHsBwVCbyhxBm+cUvmtC++XtQKFwxmd2Vx3cHB7wreo=', 'x-amz-request-id': 'WTF0F26H74QQ35MN', 'Date': 'Fri, 11 Nov 2022 00:28:16 GMT', 'ETag': '"325949f7f7af65480a3808b806ae8925"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180312T000000, start_date=20221111T002815, end_date=20221111T002816 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:16.967172Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0dcd956c-0cc6-4f58-b98d-7dcfbc5d3b7d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..28c9fb26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:13.451144Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "281a03dc-7a31-40dd-8244-893b60d5fe46"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:13.451144+00:00, try_number=1, job_id=123, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-12 00:00:00+00:00 +INFO - Started process 799 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-12T00:00:00+00:00', '--job-id', '123', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxe9pt1nu'] +INFO - Job 123: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002814Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002814Z +20221111/us-east-1/s3/aws4_request +c36c9b9c3b75f11ee308dfd63e8addc917034430c7c3dc2a2144760628aedda4 +INFO - '2022-11-11' - botocore.auth - Signature: +317af2e9879229d52081d551f3c0191f69c3bec35ae4e044a0302aac96ca2427 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'yIKSbv7DxYyornCsl0qbw2ucIQH6zaMl2kURVr3lEg2SceRhkhDarknLyB75OXV5R+BLwPi0ULU=', 'x-amz-request-id': '4N1R34W7YN4TGS9P', 'Date': 'Fri, 11 Nov 2022 00:28:14 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180312T000000, start_date=20221111T002813, end_date=20221111T002815 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:15.669183Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "281a03dc-7a31-40dd-8244-893b60d5fe46"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8c5b664b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:08.693054Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c0b365b4-40cc-427d-91a8-af4f400d89ab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:08.693054+00:00, try_number=1, job_id=121, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-12 00:00:00+00:00 +INFO - Started process 767 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-12T00:00:00+00:00', '--job-id', '121', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzx32whnx'] +INFO - Job 121: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180312T000000, start_date=20221111T002808, end_date=20221111T002814 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:14.077172Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c0b365b4-40cc-427d-91a8-af4f400d89ab"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..91b4f963 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:08.695049Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d901add2-505f-363f-bdbe-c85dcab4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a943abf-ba6a-4cca-8e97-88cc2370eee0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:08.695049+00:00, try_number=1, job_id=122, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-12 00:00:00+00:00 +INFO - Started process 763 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-12T00:00:00+00:00', '--job-id', '122', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx68nvpz6'] +INFO - Job 122: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180312T000000, start_date=20221111T002808, end_date=20221111T002812 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:12.281504Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a943abf-ba6a-4cca-8e97-88cc2370eee0"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..dd52c526 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:18.683341Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7b0fe863-ae87-42c9-9406-3dbaaf80c16d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:18.683341+00:00, try_number=1, job_id=126, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-13 00:00:00+00:00 +INFO - Started process 842 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-13T00:00:00+00:00', '--job-id', '126', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcvg_q_b8'] +INFO - Job 126: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180313T000000, start_date=20221111T002818, end_date=20221111T002821 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:21.271323Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7b0fe863-ae87-42c9-9406-3dbaaf80c16d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a2a1f2bc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:18.667114Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b7da6c5-bd48-45dd-a87e-5689a24b2212"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:18.667114+00:00, try_number=1, job_id=125, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-13 00:00:00+00:00 +INFO - Started process 839 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-13T00:00:00+00:00', '--job-id', '125', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7fuggfcg'] +INFO - Job 125: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180313T000000, start_date=20221111T002818, end_date=20221111T002821 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:21.366921Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b7da6c5-bd48-45dd-a87e-5689a24b2212"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..af3482cf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:27.267840Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bf93135f-95f9-42fe-9a7e-bfe1b689388e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:27.267840+00:00, try_number=1, job_id=130, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-13 00:00:00+00:00 +INFO - Started process 817 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-13T00:00:00+00:00', '--job-id', '130', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv4to0i0x'] +INFO - Job 130: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ee940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'QwdEfNJsyPkSoVaIkYO84w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:QwdEfNJsyPkSoVaIkYO84w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002827Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002827Z +20221111/us-east-1/s3/aws4_request +3339441a5484642ce52e2a04bfc131540690afda11f0ae91a4334d50346050a4 +INFO - '2022-11-11' - botocore.auth - Signature: +3d5f94c1b7605b51dc4a9ac9fb77b90b1d8227fa318eec00c15ee6f801eb0571 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jRkv4mDUirKOAhe7nWMyshMgQn8YBr0zXx++NfBKQ5jII0k8dWad4D/ASKMbeQV42sHlkNkD7p0=', 'x-amz-request-id': 'F13S91J076Z9KB8K', 'Date': 'Fri, 11 Nov 2022 00:28:28 GMT', 'ETag': '"4307447cd26cc8f912a156889183bce3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180313T000000, start_date=20221111T002827, end_date=20221111T002829 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:29.408041Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bf93135f-95f9-42fe-9a7e-bfe1b689388e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..63f54d26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:26.638702Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cee09b4-d354-4cac-a67b-53a416b5e892"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:26.638702+00:00, try_number=1, job_id=129, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-13 00:00:00+00:00 +INFO - Started process 848 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-13T00:00:00+00:00', '--job-id', '129', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv6w1s1gi'] +INFO - Job 129: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002827Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002827Z +20221111/us-east-1/s3/aws4_request +25bb10e17d2cfb53c8f5a02bf947e25d9a03d4915de6ee763d41b2a4fd8a80b5 +INFO - '2022-11-11' - botocore.auth - Signature: +f58a45530969c14310837fa6ad601d547cfd57b95455a101e91585403d9d865f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '4Z7vQ7EsSc6jEH0xFXnCFOpKl556jFwyEEKKmi/lBWj4Ax7hKjOlJUuvvT72WGV4FVBFzKDuLZE=', 'x-amz-request-id': 'F13J713B7N0J24R5', 'Date': 'Fri, 11 Nov 2022 00:28:28 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180313T000000, start_date=20221111T002826, end_date=20221111T002828 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:28.896943Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cee09b4-d354-4cac-a67b-53a416b5e892"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..68143fec --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:22.444276Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b4eef749-681b-48aa-adb4-8b288a1ea363"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:22.444276+00:00, try_number=1, job_id=128, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-13 00:00:00+00:00 +INFO - Started process 811 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-13T00:00:00+00:00', '--job-id', '128', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsfbpq9wj'] +INFO - Job 128: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180313T000000, start_date=20221111T002822, end_date=20221111T002825 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:25.726427Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b4eef749-681b-48aa-adb4-8b288a1ea363"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..64aef8de --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:22.437013Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7bdc1d8b-e86b-3ee4-bc30-dd4cd9a2e494"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3aafd557-b58f-4988-8e05-3bdaa713c3d7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:22.437013+00:00, try_number=1, job_id=127, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-13 00:00:00+00:00 +INFO - Started process 810 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-13T00:00:00+00:00', '--job-id', '127', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpezogo8m5'] +INFO - Job 127: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180313T000000, start_date=20221111T002822, end_date=20221111T002824 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:24.866719Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3aafd557-b58f-4988-8e05-3bdaa713c3d7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..65971558 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:31.593444Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd8593b4-7e1b-4d86-b1be-f5bee0f6f8ba"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:31.593444+00:00, try_number=1, job_id=132, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-14 00:00:00+00:00 +INFO - Started process 859 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-14T00:00:00+00:00', '--job-id', '132', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgkbgx0_6'] +INFO - Job 132: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180314T000000, start_date=20221111T002831, end_date=20221111T002834 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:34.081900Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd8593b4-7e1b-4d86-b1be-f5bee0f6f8ba"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..88c9e883 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:31.581657Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "808d7c56-56e1-4343-94d5-beb3d6cc7f6d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:31.581657+00:00, try_number=1, job_id=131, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-14 00:00:00+00:00 +INFO - Started process 858 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-14T00:00:00+00:00', '--job-id', '131', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8lbawyh9'] +INFO - Job 131: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180314T000000, start_date=20221111T002831, end_date=20221111T002834 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:34.136026Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "808d7c56-56e1-4343-94d5-beb3d6cc7f6d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..43ad6532 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:47.588357Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bb89904-a356-4f6f-8a9f-60a78fea1665"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:47.588357+00:00, try_number=1, job_id=136, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-14 00:00:00+00:00 +INFO - Started process 889 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-14T00:00:00+00:00', '--job-id', '136', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3zn5is1_'] +INFO - Job 136: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'QwdEfNJsyPkSoVaIkYO84w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:QwdEfNJsyPkSoVaIkYO84w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002848Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002848Z +20221111/us-east-1/s3/aws4_request +8ba8e3b747b3cf707a6eb20c45223ad13661d4fdb52f9d6df21e35fa24699283 +INFO - '2022-11-11' - botocore.auth - Signature: +7340d1afe41d78063fe184b2e33f992f91f9f54dd8d5c418cbf6aa5e1cfe93be +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BBrvBlAK+/y2z6eYcOOoHqOYuOKFyUYCSMzcZF8HskrvfawDhOGZbn2tYjTTr7zUvmGfVLPot/o=', 'x-amz-request-id': '71988PDY2QEAK44A', 'Date': 'Fri, 11 Nov 2022 00:28:48 GMT', 'ETag': '"4307447cd26cc8f912a156889183bce3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180314T000000, start_date=20221111T002847, end_date=20221111T002849 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:49.394478Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bb89904-a356-4f6f-8a9f-60a78fea1665"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..532ad70b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:43.060223Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6217f7d-4e18-4e2d-9acb-41c66b64d157"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:43.060223+00:00, try_number=1, job_id=135, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-14 00:00:00+00:00 +INFO - Started process 939 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-14T00:00:00+00:00', '--job-id', '135', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppi4vle_8'] +INFO - Job 135: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002844Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002844Z +20221111/us-east-1/s3/aws4_request +01c93dd5dfa91a1ba656ff1af5f16c05e455798a966c32efa71628509f3e191b +INFO - '2022-11-11' - botocore.auth - Signature: +498d4832deb4ee72c10bcc965e064491625040245e0ecc3ba80abd5f99efdfc5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'P1qEG0ltxxp1hciBBCUgy6TBXnFS6+iQWdnDilDJiRbS5hTqbmzfvkTmnt1/11WuQK6gw11d2PU=', 'x-amz-request-id': 'WMJ5K10YXR8PCZSE', 'Date': 'Fri, 11 Nov 2022 00:28:45 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180314T000000, start_date=20221111T002843, end_date=20221111T002846 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:46.130751Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6217f7d-4e18-4e2d-9acb-41c66b64d157"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..f67dc4b2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:35.831235Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49f431da-6953-4a3f-8976-a2f9b43c0e35"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:35.831235+00:00, try_number=1, job_id=133, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-14 00:00:00+00:00 +INFO - Started process 879 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-14T00:00:00+00:00', '--job-id', '133', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppxmf7qr2'] +INFO - Job 133: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180314T000000, start_date=20221111T002835, end_date=20221111T002845 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:45.764630Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49f431da-6953-4a3f-8976-a2f9b43c0e35"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..de94b143 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:35.891479Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2f187929-3867-3d9b-b108-d204ac8fe02e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "89f97595-f4a5-4020-8b89-f48725be1936"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:35.891479+00:00, try_number=1, job_id=134, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-14 00:00:00+00:00 +INFO - Started process 884 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-14T00:00:00+00:00', '--job-id', '134', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd7tfzrf8'] +INFO - Job 134: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180314T000000, start_date=20221111T002835, end_date=20221111T002839 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:39.202706Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "89f97595-f4a5-4020-8b89-f48725be1936"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f0100428 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:51.747043Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "55a3c35d-d3c8-4e4b-a88f-6cd4b844b348"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:51.747043+00:00, try_number=1, job_id=138, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-15 00:00:00+00:00 +INFO - Started process 900 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-15T00:00:00+00:00', '--job-id', '138', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzhg0d3zm'] +INFO - Job 138: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180315T000000, start_date=20221111T002851, end_date=20221111T002854 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:54.873857Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "55a3c35d-d3c8-4e4b-a88f-6cd4b844b348"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..740f1ad2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:28:51.695872Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "78abb819-c301-4b9b-aeec-7b1fe64c3e41"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:51.695872+00:00, try_number=1, job_id=137, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-15 00:00:00+00:00 +INFO - Started process 897 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-15T00:00:00+00:00', '--job-id', '137', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp814gz_z4'] +INFO - Job 137: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180315T000000, start_date=20221111T002851, end_date=20221111T002854 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:28:54.879913Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "78abb819-c301-4b9b-aeec-7b1fe64c3e41"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..ed3167aa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:03.165760Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "83261184-9a4d-4a40-b5de-65ecfcccade0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:03.165760+00:00, try_number=1, job_id=142, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-15 00:00:00+00:00 +INFO - Started process 953 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-15T00:00:00+00:00', '--job-id', '142', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7rdrzmdf'] +INFO - Job 142: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'l7rYouMpAqqHpfYjrW4K/Q==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:l7rYouMpAqqHpfYjrW4K/Q== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002903Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002903Z +20221111/us-east-1/s3/aws4_request +25adcaa824100c5526fa724bfa4325ffb6e1538ad8dbb4ae7339c88190f628ed +INFO - '2022-11-11' - botocore.auth - Signature: +525a966622bdff39c5376cd1a6c1faf693a82343d7748073a3fdfcabc278f925 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'hAAXxuk7p8A4avE1DL+vsJU5mr9gN80VtDxKs+IOJt4/zrmc5NF2SCjy20yDzohHjOPPwlCF5Xo=', 'x-amz-request-id': 'DN5SJQG2JMDGW3RB', 'Date': 'Fri, 11 Nov 2022 00:29:04 GMT', 'ETag': '"97bad8a2e32902aa87a5f623ad6e0afd"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180315T000000, start_date=20221111T002903, end_date=20221111T002904 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:04.832737Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "83261184-9a4d-4a40-b5de-65ecfcccade0"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4a44ad83 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:01.857685Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f6ef1ad-fbe6-4248-887f-aa5856e14989"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:01.857685+00:00, try_number=1, job_id=141, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-15 00:00:00+00:00 +INFO - Started process 948 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-15T00:00:00+00:00', '--job-id', '141', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgrhmndsw'] +INFO - Job 141: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002902Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002902Z +20221111/us-east-1/s3/aws4_request +5f3062b2e3d3f76c02e09bb486bcad17e12fbe2662968b6584efca31141b239e +INFO - '2022-11-11' - botocore.auth - Signature: +5fe386d9ffe84eb9fa6f627bf6a149fdf707129ed59f0fa1f8288f0c2e908e4d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'ZeMzu4T7zOqiRYoSYBitYNRzGOmFjutsGpTag1h41TUDv7Bpzdl+T+mze/mik/zkwCTu07ktiBU=', 'x-amz-request-id': '66FN6WNF6CJ6QFAD', 'Date': 'Fri, 11 Nov 2022 00:29:03 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180315T000000, start_date=20221111T002901, end_date=20221111T002903 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:03.697085Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f6ef1ad-fbe6-4248-887f-aa5856e14989"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..982862d9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:57.418270Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92b19c3a-9e93-4c91-afb6-7b5b07418ad2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:57.418270+00:00, try_number=1, job_id=140, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-15 00:00:00+00:00 +INFO - Started process 910 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-15T00:00:00+00:00', '--job-id', '140', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1q0yfcvp'] +INFO - Job 140: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180315T000000, start_date=20221111T002857, end_date=20221111T002901 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:01.465927Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92b19c3a-9e93-4c91-afb6-7b5b07418ad2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..200bfa19 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:28:57.392107Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "640d4b0e-6166-3b26-8369-0bf6602df4ba"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "609cb054-cb5a-4128-b197-c3742e903301"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:28:57.392107+00:00, try_number=1, job_id=139, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-15 00:00:00+00:00 +INFO - Started process 909 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-15T00:00:00+00:00', '--job-id', '139', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyhnp7byq'] +INFO - Job 139: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180315T000000, start_date=20221111T002857, end_date=20221111T002900 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:00.504992Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "609cb054-cb5a-4128-b197-c3742e903301"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0776470a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:06.595339Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf969616-cf4a-463a-ba0d-4fd75e5dec10"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:06.595339+00:00, try_number=1, job_id=144, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-16 00:00:00+00:00 +INFO - Started process 935 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-16T00:00:00+00:00', '--job-id', '144', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg948il1s'] +INFO - Job 144: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180316T000000, start_date=20221111T002906, end_date=20221111T002909 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:09.220787Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf969616-cf4a-463a-ba0d-4fd75e5dec10"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..be8529fb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:06.570426Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0010db4c-274c-4bab-a231-1a0c3d3b4f64"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:06.570426+00:00, try_number=1, job_id=143, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-16 00:00:00+00:00 +INFO - Started process 927 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-16T00:00:00+00:00', '--job-id', '143', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpglg8v2aw'] +INFO - Job 143: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180316T000000, start_date=20221111T002906, end_date=20221111T002909 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:09.222907Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0010db4c-274c-4bab-a231-1a0c3d3b4f64"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bc8ec328 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:17.971517Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41add93e-a769-4f21-9aa5-27602b30cce3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:17.971517+00:00, try_number=1, job_id=148, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-16 00:00:00+00:00 +INFO - Started process 1036 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-16T00:00:00+00:00', '--job-id', '148', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf61fkx5q'] +INFO - Job 148: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'vUfjsporO6oLfz9iwZAZ+g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:vUfjsporO6oLfz9iwZAZ+g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002918Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002918Z +20221111/us-east-1/s3/aws4_request +ecfc6c4c1acf8faddeb70eb231a3fe300a25a77be8b6c8fa8959e2414a645bcd +INFO - '2022-11-11' - botocore.auth - Signature: +8bb8a4d9fccd496e168a1a3628f9e514c5fa128e0eda9df2f69a3e85b9f55b8a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'QVirjI0NsLFXDpMjuAgxwZ5eJ4bQsjFuxQUAvt8W0TAZzVn9TnPGg7Ra7ebDkZp4ByBuo0ewsvw=', 'x-amz-request-id': '1Q7ZVEW4V4PE92BN', 'Date': 'Fri, 11 Nov 2022 00:29:19 GMT', 'ETag': '"bd47e3b29a2b3baa0b7f3f62c19019fa"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180316T000000, start_date=20221111T002917, end_date=20221111T002919 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:19.732282Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41add93e-a769-4f21-9aa5-27602b30cce3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..0c232597 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:16.459893Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "762b591e-085d-468b-9aed-c018ad37977f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:16.459893+00:00, try_number=1, job_id=147, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-16 00:00:00+00:00 +INFO - Started process 991 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-16T00:00:00+00:00', '--job-id', '147', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppnmkj5bd'] +INFO - Job 147: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002917Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002917Z +20221111/us-east-1/s3/aws4_request +52a3c0ed3ae1f8af41909e2082e480d0eef0e9aa72b01c7bfe0791dfcce58ad9 +INFO - '2022-11-11' - botocore.auth - Signature: +19b0c67a5e4728cda3476cef4a89f26024c7707da7605c21cb390432d72a6b76 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'V+ltwRtfsc/2uHegyiJPzd0bqieIQSFO6huPWcsI9oHBCv/7xerAcSD4z+CwcBXteZbS4eB98qs=', 'x-amz-request-id': 'XH9G69M0Q6MEYZVZ', 'Date': 'Fri, 11 Nov 2022 00:29:17 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180316T000000, start_date=20221111T002916, end_date=20221111T002918 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:18.092873Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "762b591e-085d-468b-9aed-c018ad37977f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..bf8db548 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:11.433331Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64012ccf-d3ad-4c91-abac-d152d7b92fd8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:11.433331+00:00, try_number=1, job_id=145, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-16 00:00:00+00:00 +INFO - Started process 1004 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-16T00:00:00+00:00', '--job-id', '145', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7u850krf'] +INFO - Job 145: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180316T000000, start_date=20221111T002911, end_date=20221111T002916 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:16.584764Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64012ccf-d3ad-4c91-abac-d152d7b92fd8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..1fa5ccce --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:11.438925Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "02338500-870c-3e0a-abb4-964a3a3efa49"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4fd2e0ea-4a0e-48a1-8fc0-407aa02dad98"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:11.438925+00:00, try_number=1, job_id=146, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-16 00:00:00+00:00 +INFO - Started process 1006 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-16T00:00:00+00:00', '--job-id', '146', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplz_mveg7'] +INFO - Job 146: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180316T000000, start_date=20221111T002911, end_date=20221111T002914 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:14.909347Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4fd2e0ea-4a0e-48a1-8fc0-407aa02dad98"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f6677621 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:22.172817Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b5bc34b3-6bb2-4805-ae45-75ab7736287d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:22.172817+00:00, try_number=1, job_id=149, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-17 00:00:00+00:00 +INFO - Started process 1045 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-17T00:00:00+00:00', '--job-id', '149', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkh4co4dh'] +INFO - Job 149: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180317T000000, start_date=20221111T002922, end_date=20221111T002925 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:25.291996Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b5bc34b3-6bb2-4805-ae45-75ab7736287d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c757d368 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:22.183803Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a9918ab6-0d91-4876-95dd-0b93a1461ace"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:22.183803+00:00, try_number=1, job_id=150, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-17 00:00:00+00:00 +INFO - Started process 1047 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-17T00:00:00+00:00', '--job-id', '150', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvyhwo1_7'] +INFO - Job 150: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180317T000000, start_date=20221111T002922, end_date=20221111T002925 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:25.293762Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a9918ab6-0d91-4876-95dd-0b93a1461ace"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1fb4bc31 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:32.685730Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b8befa76-9cf0-4473-9be9-a4e662efa9ee"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:32.685730+00:00, try_number=1, job_id=154, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-17 00:00:00+00:00 +INFO - Started process 1059 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-17T00:00:00+00:00', '--job-id', '154', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkx74jux9'] +INFO - Job 154: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'vUfjsporO6oLfz9iwZAZ+g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:vUfjsporO6oLfz9iwZAZ+g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002933Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002933Z +20221111/us-east-1/s3/aws4_request +ee3268fccccb782b8800022df2379e58d92b446daad61b71027830b9ba7cad23 +INFO - '2022-11-11' - botocore.auth - Signature: +6b822e78c35176ab61e97855ae944d83d9714f8cf7724096648fda5b7bad6f5d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jBKIq/gIp9HJWqSVKDJOKmzLCLNGLf3jisJHUzuVlUPup6V0UMRmA4EPEsAqVylzDMZYbaCiMiA=', 'x-amz-request-id': '0TE7X90GKARZER46', 'Date': 'Fri, 11 Nov 2022 00:29:33 GMT', 'ETag': '"bd47e3b29a2b3baa0b7f3f62c19019fa"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180317T000000, start_date=20221111T002932, end_date=20221111T002934 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:34.594698Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b8befa76-9cf0-4473-9be9-a4e662efa9ee"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1fbe9d0c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:31.221162Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92d132c6-14a3-4053-a548-e3a23717c1f8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:31.221162+00:00, try_number=1, job_id=153, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-17 00:00:00+00:00 +INFO - Started process 1054 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-17T00:00:00+00:00', '--job-id', '153', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvil61pm2'] +INFO - Job 153: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002932Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002932Z +20221111/us-east-1/s3/aws4_request +2abc90d1ba4af02aecb92db792dc46dea963e812a6be0b7edee499f79bb08534 +INFO - '2022-11-11' - botocore.auth - Signature: +72da6ff40b28ee37d13852886c88b0b4b30d2dcdccf44585ff459154a845c289 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'RcbL0ZIKdRjoU+S4RG/E8K5w9kj15+9/VS8M/Tp0ypwGGETGtffEC8vb6922bzgbokxQHOsraBE4b0BJimCYnw==', 'x-amz-request-id': '0TE538K493MNQ06B', 'Date': 'Fri, 11 Nov 2022 00:29:33 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180317T000000, start_date=20221111T002931, end_date=20221111T002933 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:33.970839Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92d132c6-14a3-4053-a548-e3a23717c1f8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..df55811b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:26.871090Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf64e990-f9ad-4008-9429-2f8a99ca5ce6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:26.871090+00:00, try_number=1, job_id=152, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-17 00:00:00+00:00 +INFO - Started process 1000 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-17T00:00:00+00:00', '--job-id', '152', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptcn9dmez'] +INFO - Job 152: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180317T000000, start_date=20221111T002926, end_date=20221111T002930 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:30.827441Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf64e990-f9ad-4008-9429-2f8a99ca5ce6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e5383f1f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:26.874306Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c84b4f95-0534-33db-ada2-cee28fe95e0b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fdd06cdf-daf6-4944-851c-81d9215e86be"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:26.874306+00:00, try_number=1, job_id=151, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-17 00:00:00+00:00 +INFO - Started process 1002 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-17T00:00:00+00:00', '--job-id', '151', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmporwot_94'] +INFO - Job 151: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180317T000000, start_date=20221111T002926, end_date=20221111T002929 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:29.734946Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fdd06cdf-daf6-4944-851c-81d9215e86be"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0ae5c878 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:36.453095Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "927788ce-6e5a-4c1a-b97c-0f072d727686"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:36.453095+00:00, try_number=1, job_id=156, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-18 00:00:00+00:00 +INFO - Started process 1077 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-18T00:00:00+00:00', '--job-id', '156', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp62oopdha'] +INFO - Job 156: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180318T000000, start_date=20221111T002936, end_date=20221111T002940 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:40.043028Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "927788ce-6e5a-4c1a-b97c-0f072d727686"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bb7d2508 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:36.460348Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5c19cbd2-e981-4538-904b-53f0b1cabcec"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:36.460348+00:00, try_number=1, job_id=155, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-18 00:00:00+00:00 +INFO - Started process 1084 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-18T00:00:00+00:00', '--job-id', '155', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdv0j1iup'] +INFO - Job 155: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180318T000000, start_date=20221111T002936, end_date=20221111T002940 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:40.038877Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5c19cbd2-e981-4538-904b-53f0b1cabcec"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d9502e66 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:48.584349Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b51e1dc-d1a4-426b-b03f-5a46d59c7201"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:48.584349+00:00, try_number=1, job_id=160, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-18 00:00:00+00:00 +INFO - Started process 1089 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-18T00:00:00+00:00', '--job-id', '160', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl219leli'] +INFO - Job 160: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'UENt2MPXdim5v0BzUvBLyg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:UENt2MPXdim5v0BzUvBLyg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002949Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002949Z +20221111/us-east-1/s3/aws4_request +a8739a3ebf1f8d90777a7a4f74f42d6df224b29783279ef0d37be9b77ca6c79d +INFO - '2022-11-11' - botocore.auth - Signature: +b72f0997aee5c6fa3243f6b072fa22daa42f105f403ef2cb12ab723cafc3d364 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'x5TPcbySAKn/mlP/eQB+ZicmRFU4nDXcIrE3LOn/EQCFflD5K2xXTMhxoFjvgPlHKsj1k2FyBYNYxhSLhKcbaQ==', 'x-amz-request-id': 'HJJ2B6W9NN6JRN04', 'Date': 'Fri, 11 Nov 2022 00:29:49 GMT', 'ETag': '"50436dd8c3d77629b9bf407352f04bca"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180318T000000, start_date=20221111T002948, end_date=20221111T002950 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:50.030157Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b51e1dc-d1a4-426b-b03f-5a46d59c7201"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..7bace554 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:46.476157Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0760b81a-f8db-4e8a-9b69-8f04aae1d585"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:46.476157+00:00, try_number=1, job_id=159, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-18 00:00:00+00:00 +INFO - Started process 1080 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-18T00:00:00+00:00', '--job-id', '159', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5rhpy8n6'] +INFO - Job 159: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T002947Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T002947Z +20221111/us-east-1/s3/aws4_request +db3c634555b9f97af876d4426e1dccdb230b2f5c0425adfc3bfc13a5bc26c297 +INFO - '2022-11-11' - botocore.auth - Signature: +5e0a5963546b6cbe6cd084be11dd2657db3a8c46638a538d98292218c8e58368 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jEoyUsBOHcM9A4oJHIHbr565PC1ZEjdxPQGjK8ied5LyvvAKntFaETLD7XnQCHXCqsTGO3hBNynUfpAqXlz3iQ==', 'x-amz-request-id': 'PQP4G5VVNWXHVSE8', 'Date': 'Fri, 11 Nov 2022 00:29:48 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180318T000000, start_date=20221111T002946, end_date=20221111T002948 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:48.708257Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0760b81a-f8db-4e8a-9b69-8f04aae1d585"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..0753aaf1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:42.027393Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9b9af43-05c3-4493-889d-c02be77ac8fd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:42.027393+00:00, try_number=1, job_id=157, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-18 00:00:00+00:00 +INFO - Started process 1061 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-18T00:00:00+00:00', '--job-id', '157', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt6qvxjjl'] +INFO - Job 157: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180318T000000, start_date=20221111T002942, end_date=20221111T002947 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:47.229525Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9b9af43-05c3-4493-889d-c02be77ac8fd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..931a2f12 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:42.038939Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f407a6e6-a80e-3b34-9410-9610b742476d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "70ec57d5-62a2-4c3b-b85b-55b99eb10fa9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:42.038939+00:00, try_number=1, job_id=158, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-18 00:00:00+00:00 +INFO - Started process 1062 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-18T00:00:00+00:00', '--job-id', '158', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmperwx13ky'] +INFO - Job 158: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180318T000000, start_date=20221111T002942, end_date=20221111T002945 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:45.032476Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "70ec57d5-62a2-4c3b-b85b-55b99eb10fa9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b063fc03 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:52.638766Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dfcffc62-4163-4c91-808e-0ffbbb9f6d32"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:52.638766+00:00, try_number=1, job_id=161, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-19 00:00:00+00:00 +INFO - Started process 1098 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-19T00:00:00+00:00', '--job-id', '161', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwfao_el6'] +INFO - Job 161: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180319T000000, start_date=20221111T002952, end_date=20221111T002955 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:55.966498Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dfcffc62-4163-4c91-808e-0ffbbb9f6d32"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..f5c456b9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:29:53.794907Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cc265fd5-3517-4ca4-821b-86a5a3354b09"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:53.794907+00:00, try_number=1, job_id=162, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-19 00:00:00+00:00 +INFO - Started process 1101 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-19T00:00:00+00:00', '--job-id', '162', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmazp7gq4'] +INFO - Job 162: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180319T000000, start_date=20221111T002953, end_date=20221111T002956 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:29:56.875058Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cc265fd5-3517-4ca4-821b-86a5a3354b09"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4d85f32a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:05.783803Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5606023f-9cce-4e48-bddf-aa1e1eed8c37"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:05.783803+00:00, try_number=1, job_id=166, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-19 00:00:00+00:00 +INFO - Started process 1117 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-19T00:00:00+00:00', '--job-id', '166', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxa6eksyy'] +INFO - Job 166: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'rJiTVFUqRQQf6+KWacRH1A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:rJiTVFUqRQQf6+KWacRH1A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003006Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003006Z +20221111/us-east-1/s3/aws4_request +435e93a6290aae93f6e67cabc52fe30d8d12a9e6c574dfdc3437f8cb16bebf34 +INFO - '2022-11-11' - botocore.auth - Signature: +79465aaca705ab8c2644781c41ce9df2202e22d6b45bae92a60cd42a292162a6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Mbjjm+6XTzSGnEA/DfjdDG1AwuKa9qn4dPIodIieRfCevq0ALUWKL4UcO3Y1zdjYv2VA3cBAlEs=', 'x-amz-request-id': 'F8AR6CXADN0EVHTC', 'Date': 'Fri, 11 Nov 2022 00:30:07 GMT', 'ETag': '"ac989354552a45041febe29669c447d4"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180319T000000, start_date=20221111T003005, end_date=20221111T003007 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:07.726068Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5606023f-9cce-4e48-bddf-aa1e1eed8c37"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..888c914b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:03.748089Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c69b686-82ec-446b-a66b-9bb0924ef286"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:03.748089+00:00, try_number=1, job_id=165, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-19 00:00:00+00:00 +INFO - Started process 1142 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-19T00:00:00+00:00', '--job-id', '165', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvm3swbz2'] +INFO - Job 165: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50083a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003004Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003004Z +20221111/us-east-1/s3/aws4_request +29dd6000ee2ce2bde0ad4e3886cf169ea5763a022330016c3bb5d4d5d4bdae4c +INFO - '2022-11-11' - botocore.auth - Signature: +41b42df821082ebe101f1b371ee727439021287877de988a4478cc0c09008d55 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'lfuBcz8hehlQUrly3C5D4ToS2mrM8aYCT3CdXRdeg5c4h81tj/ghXAq9UOfnbcSwmJmz9omYPnY=', 'x-amz-request-id': 'DKYAYJ2XYTV9VTWK', 'Date': 'Fri, 11 Nov 2022 00:30:04 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180319T000000, start_date=20221111T003003, end_date=20221111T003005 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:05.609725Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c69b686-82ec-446b-a66b-9bb0924ef286"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..64f28d53 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:58.608526Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "42088f13-24b7-423e-a4be-a68c7b4f6899"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:58.608526+00:00, try_number=1, job_id=163, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-19 00:00:00+00:00 +INFO - Started process 1108 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-19T00:00:00+00:00', '--job-id', '163', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjp69k9ze'] +INFO - Job 163: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180319T000000, start_date=20221111T002958, end_date=20221111T003003 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:03.803152Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "42088f13-24b7-423e-a4be-a68c7b4f6899"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..69ea85e5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:29:58.796206Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "87d91b1b-c7eb-3c51-ac38-1fc672425379"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49332761-cb96-4e3f-9657-7ae173a60477"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:29:58.796206+00:00, try_number=1, job_id=164, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-19 00:00:00+00:00 +INFO - Started process 1111 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-19T00:00:00+00:00', '--job-id', '164', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2d7ud01o'] +INFO - Job 164: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180319T000000, start_date=20221111T002958, end_date=20221111T003002 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:02.149823Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49332761-cb96-4e3f-9657-7ae173a60477"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9344bcc4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:09.897491Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0bcfade5-41c2-40a8-a10a-9a1dc9fe4763"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:09.897491+00:00, try_number=1, job_id=167, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-20 00:00:00+00:00 +INFO - Started process 1178 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-20T00:00:00+00:00', '--job-id', '167', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjptk_a_b'] +INFO - Job 167: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180320T000000, start_date=20221111T003009, end_date=20221111T003013 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:13.581377Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0bcfade5-41c2-40a8-a10a-9a1dc9fe4763"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b03ebd3c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:09.892283Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5b5be012-b92f-40cc-a2ee-0c53338f2031"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:09.892283+00:00, try_number=1, job_id=168, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-20 00:00:00+00:00 +INFO - Started process 1175 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-20T00:00:00+00:00', '--job-id', '168', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2mgicl47'] +INFO - Job 168: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180320T000000, start_date=20221111T003009, end_date=20221111T003013 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:13.510021Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5b5be012-b92f-40cc-a2ee-0c53338f2031"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..311fe5b2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:23.326567Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f32826fe-4165-498f-9c50-9ef97bbfc60d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:23.326567+00:00, try_number=1, job_id=172, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-20 00:00:00+00:00 +INFO - Started process 1189 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-20T00:00:00+00:00', '--job-id', '172', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxkc__f58'] +INFO - Job 172: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'rJiTVFUqRQQf6+KWacRH1A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:rJiTVFUqRQQf6+KWacRH1A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003024Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003024Z +20221111/us-east-1/s3/aws4_request +3622e5d9582d49848db96c31c693accf99eef9cbd02ebd9a2fd48aeb95671d10 +INFO - '2022-11-11' - botocore.auth - Signature: +05caa5ea5d8a46423914ee96dbe73206e06b19b97a3f5c4e4e6389fdffa31e8a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'JPbFunAn0dJRaCvcwgU+vFh7Lohog+NCk1KgcjonFDiELbmoszmQpH7R3Cp8LX0ek09ugMT4338=', 'x-amz-request-id': 'EC31VZ43GYDE55RR', 'Date': 'Fri, 11 Nov 2022 00:30:24 GMT', 'ETag': '"ac989354552a45041febe29669c447d4"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180320T000000, start_date=20221111T003023, end_date=20221111T003025 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:25.205953Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f32826fe-4165-498f-9c50-9ef97bbfc60d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..00b840d0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:20.705703Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74c01b48-95fa-41d9-8cf7-d05077b5eace"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:20.705703+00:00, try_number=1, job_id=171, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-20 00:00:00+00:00 +INFO - Started process 1233 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-20T00:00:00+00:00', '--job-id', '171', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgj12yjfm'] +INFO - Job 171: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003021Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003021Z +20221111/us-east-1/s3/aws4_request +3cc6b3c8e1cd44e55db38958db45608d19819a0a298ad9b92d6012d987e49108 +INFO - '2022-11-11' - botocore.auth - Signature: +54b21bebfcdcfba7953b9e32960c888270bd2c2220455862b07effadd68780a0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'R4JrqyNoaaaDEMT0qdta/GBXxr+oQEhPaVc6yn0kLxK8h6BBiNYgInvfCzODPp6Ybm2xDUgbmJY=', 'x-amz-request-id': 'C8VBR22GS56MMAW3', 'Date': 'Fri, 11 Nov 2022 00:30:22 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180320T000000, start_date=20221111T003020, end_date=20221111T003023 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:23.041668Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74c01b48-95fa-41d9-8cf7-d05077b5eace"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..5ef3a77c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:16.628153Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45c89738-abcd-4709-9176-0ef62400cef1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:16.628153+00:00, try_number=1, job_id=170, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-20 00:00:00+00:00 +INFO - Started process 1226 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-20T00:00:00+00:00', '--job-id', '170', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwgvs5rw_'] +INFO - Job 170: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180320T000000, start_date=20221111T003016, end_date=20221111T003021 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:21.895842Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45c89738-abcd-4709-9176-0ef62400cef1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..8ed5f476 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:15.749056Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3d0486cf-3a81-3ce6-8de0-d6662a7decff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5aeb653c-9e35-4a00-ad58-d328f495cf54"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:15.749056+00:00, try_number=1, job_id=169, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-20 00:00:00+00:00 +INFO - Started process 1220 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-20T00:00:00+00:00', '--job-id', '169', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpassj40nb'] +INFO - Job 169: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180320T000000, start_date=20221111T003015, end_date=20221111T003019 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:19.183839Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5aeb653c-9e35-4a00-ad58-d328f495cf54"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..5085c638 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:26.788414Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0172a890-6ab9-4759-8d23-afb674c7a5fe"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:26.788414+00:00, try_number=1, job_id=173, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-21 00:00:00+00:00 +INFO - Started process 1243 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-21T00:00:00+00:00', '--job-id', '173', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpu73gdmkb'] +INFO - Job 173: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180321T000000, start_date=20221111T003026, end_date=20221111T003029 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:29.571668Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0172a890-6ab9-4759-8d23-afb674c7a5fe"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..f2eb31c8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:26.840371Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d65cdf42-25b4-4b45-aa3f-1baf598bfe0d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:26.840371+00:00, try_number=1, job_id=174, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-21 00:00:00+00:00 +INFO - Started process 1245 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-21T00:00:00+00:00', '--job-id', '174', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpru28nxj9'] +INFO - Job 174: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180321T000000, start_date=20221111T003026, end_date=20221111T003029 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:29.644730Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d65cdf42-25b4-4b45-aa3f-1baf598bfe0d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..b7db84ab --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:36.617204Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1450487b-13a6-4df9-8c28-b0db0bb28094"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:36.617204+00:00, try_number=1, job_id=178, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-21 00:00:00+00:00 +INFO - Started process 1202 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-21T00:00:00+00:00', '--job-id', '178', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplx4lg1r5'] +INFO - Job 178: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'rJiTVFUqRQQf6+KWacRH1A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:rJiTVFUqRQQf6+KWacRH1A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003037Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003037Z +20221111/us-east-1/s3/aws4_request +cb0250a7fa80db03c4ec533d9a2ee6e7b585b7146018a2af0b5489a8495cd01d +INFO - '2022-11-11' - botocore.auth - Signature: +dd98eb03d81cc71f7a305ccecbe1133dff63f2a6eaa6b1126dfb51842f7c3d5d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6AUhtaT+hXlaF76C5ikJ2QLvv6JiECqOeojtiFvs4SzILZIJOY69iXxzYT3bnVrquHd7aAKmXxI=', 'x-amz-request-id': 'ZRW4CWEEVRQSSJAR', 'Date': 'Fri, 11 Nov 2022 00:30:37 GMT', 'ETag': '"ac989354552a45041febe29669c447d4"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180321T000000, start_date=20221111T003036, end_date=20221111T003038 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:38.500628Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1450487b-13a6-4df9-8c28-b0db0bb28094"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..37d96621 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:35.296773Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "520e373e-f721-47b5-88b9-ee2e2caa012d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:35.296773+00:00, try_number=1, job_id=177, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-21 00:00:00+00:00 +INFO - Started process 1197 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-21T00:00:00+00:00', '--job-id', '177', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcttupeby'] +INFO - Job 177: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003035Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003035Z +20221111/us-east-1/s3/aws4_request +c6489612bf98a7bd71bb41196c5809353aa6e17bd141ade9de205d98d7add685 +INFO - '2022-11-11' - botocore.auth - Signature: +9736291c2e48442a78c946ab6ca8fbbe10f7d95ed9c34e352d5c426312af556d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'ACFvyVlt0WfVe08jGRQdsqrW6IUastmyv+fCmPezvrHlpiJevty3SK9UBKVvjeqoN7u2/Ym6vUk=', 'x-amz-request-id': 'P4E72W0AXNYSJHHX', 'Date': 'Fri, 11 Nov 2022 00:30:36 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180321T000000, start_date=20221111T003035, end_date=20221111T003037 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:37.325767Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "520e373e-f721-47b5-88b9-ee2e2caa012d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..64650c8b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:30.817548Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8dd35fd1-14cc-4e7d-8acb-27459e0003c9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:30.817548+00:00, try_number=1, job_id=175, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-21 00:00:00+00:00 +INFO - Started process 1252 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-21T00:00:00+00:00', '--job-id', '175', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmoq30515'] +INFO - Job 175: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180321T000000, start_date=20221111T003030, end_date=20221111T003034 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:34.919963Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8dd35fd1-14cc-4e7d-8acb-27459e0003c9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..ecfb904f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:30.964589Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2324835d-b05f-3646-bd05-c81cba3d71c2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3671ea8b-97c5-4527-ad28-e3ddd9441a71"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:30.964589+00:00, try_number=1, job_id=176, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-21 00:00:00+00:00 +INFO - Started process 1255 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-21T00:00:00+00:00', '--job-id', '176', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz92ohmo5'] +INFO - Job 176: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180321T000000, start_date=20221111T003030, end_date=20221111T003033 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:33.810052Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3671ea8b-97c5-4527-ad28-e3ddd9441a71"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..bd8c5a8c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:40.627900Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "12f95006-1a54-4586-aca4-8e300523315a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:40.627900+00:00, try_number=1, job_id=179, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-22 00:00:00+00:00 +INFO - Started process 1290 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-22T00:00:00+00:00', '--job-id', '179', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_m1x9x2s'] +INFO - Job 179: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180322T000000, start_date=20221111T003040, end_date=20221111T003043 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:43.868515Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "12f95006-1a54-4586-aca4-8e300523315a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..1c85a80b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:40.626475Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "304bfb4a-85ad-4e3c-b5c3-b459abe274c5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:40.626475+00:00, try_number=1, job_id=180, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-22 00:00:00+00:00 +INFO - Started process 1288 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-22T00:00:00+00:00', '--job-id', '180', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgd8ofosd'] +INFO - Job 180: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180322T000000, start_date=20221111T003040, end_date=20221111T003043 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:43.849111Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "304bfb4a-85ad-4e3c-b5c3-b459abe274c5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e460ef4c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:55.556179Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce3332de-9cf4-44a5-85cb-b64daa29297d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:55.556179+00:00, try_number=1, job_id=184, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-22 00:00:00+00:00 +INFO - Started process 1346 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-22T00:00:00+00:00', '--job-id', '184', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4yjmqcci'] +INFO - Job 184: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JYiTgWd2ss974r/kgvIdvA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:JYiTgWd2ss974r/kgvIdvA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003056Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003056Z +20221111/us-east-1/s3/aws4_request +35bab9d047b04f8d67d2afc7669138dce3f3cce97cf07802ef091f67121d6545 +INFO - '2022-11-11' - botocore.auth - Signature: +4e170dbf5bc142839a27fff78c9a42e489cb81a9592cae7be09204406a21f32d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'bOpW/Ep8ZFKEGtfmRDzSqk/+9vB9yfN+nl7CKVsdlSxXQACe7IwmBeNO+t7QlMiSxzWtRsO/GrE=', 'x-amz-request-id': 'MEGSYVTECXT1CDQW', 'Date': 'Fri, 11 Nov 2022 00:30:56 GMT', 'ETag': '"258893816776b2cf7be2bfe482f21dbc"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180322T000000, start_date=20221111T003055, end_date=20221111T003057 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:57.495291Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce3332de-9cf4-44a5-85cb-b64daa29297d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a7a54d9c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:51.374251Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "958c8040-3298-48e0-b0b9-db0c67e1cf02"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:51.374251+00:00, try_number=1, job_id=183, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-22 00:00:00+00:00 +INFO - Started process 1263 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-22T00:00:00+00:00', '--job-id', '183', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp49b7iim9'] +INFO - Job 183: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003053Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003053Z +20221111/us-east-1/s3/aws4_request +8132ff725387761954c9fd6200f9b050fcc13e938522b7353efc47b6a1160b10 +INFO - '2022-11-11' - botocore.auth - Signature: +3196216352c8965a4f14bc19c861fcf6e354b55b02c44ca19f6aebae03927a55 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'h1H7CRm71XoWDeAxmQ7viUDB/AEx4/3aTaRMo88bTdKKO+/DSzUBCjf+wLjFjRwCb64COs/grZU=', 'x-amz-request-id': 'ATK6E5SFNM1GH3DR', 'Date': 'Fri, 11 Nov 2022 00:30:53 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180322T000000, start_date=20221111T003051, end_date=20221111T003054 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:54.371493Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "958c8040-3298-48e0-b0b9-db0c67e1cf02"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b7ce48c7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:46.288520Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f5cbde38-6ac7-4a06-833c-4551bf8ee276"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:46.288520+00:00, try_number=1, job_id=181, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-22 00:00:00+00:00 +INFO - Started process 1334 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-22T00:00:00+00:00', '--job-id', '181', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv0jeu0ga'] +INFO - Job 181: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180322T000000, start_date=20221111T003046, end_date=20221111T003054 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:54.079659Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f5cbde38-6ac7-4a06-833c-4551bf8ee276"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..fb66b9cf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:30:46.303710Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "57bbe424-c8b3-3f89-9135-302935eea21a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9663f7f1-bae8-493f-bbf6-3dae43425a78"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:46.303710+00:00, try_number=1, job_id=182, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-22 00:00:00+00:00 +INFO - Started process 1335 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-22T00:00:00+00:00', '--job-id', '182', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph1ou2cs3'] +INFO - Job 182: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180322T000000, start_date=20221111T003046, end_date=20221111T003049 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:30:49.163421Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9663f7f1-bae8-493f-bbf6-3dae43425a78"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..38aeeff4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:59.704040Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f4c02c0-2854-48aa-8a71-679942411453"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:59.704040+00:00, try_number=1, job_id=185, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-23 00:00:00+00:00 +INFO - Started process 1357 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-23T00:00:00+00:00', '--job-id', '185', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm52t4g0m'] +INFO - Job 185: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180323T000000, start_date=20221111T003059, end_date=20221111T003102 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:02.897023Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f4c02c0-2854-48aa-8a71-679942411453"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d7811692 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:30:59.704742Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bfd626fc-a749-4380-8eea-7876508cd362"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:30:59.704742+00:00, try_number=1, job_id=186, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-23 00:00:00+00:00 +INFO - Started process 1356 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-23T00:00:00+00:00', '--job-id', '186', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1msnvhmg'] +INFO - Job 186: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180323T000000, start_date=20221111T003059, end_date=20221111T003102 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:02.909626Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bfd626fc-a749-4380-8eea-7876508cd362"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d32c2aca --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:10.551641Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cec06faa-f141-42d3-8b2e-d62907369374"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:10.551641+00:00, try_number=1, job_id=190, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-23 00:00:00+00:00 +INFO - Started process 1389 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-23T00:00:00+00:00', '--job-id', '190', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmtd3bvb3'] +INFO - Job 190: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JYiTgWd2ss974r/kgvIdvA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:JYiTgWd2ss974r/kgvIdvA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003111Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003111Z +20221111/us-east-1/s3/aws4_request +4361043b5033d2bb7727525722996a58525f70ce24b5e1b3e571cd7dbd7bd9e8 +INFO - '2022-11-11' - botocore.auth - Signature: +836fe4092eb76761328dcf45fbad0d4bce5a78ef48d936c0c8f195baf23dc0d6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'bs3/600VgWQ3y0NlFgU9lUdEocfkQcVfVm33HnJhspKNI1CetEonXV6mk2hmNmML1MztjMXKHeE=', 'x-amz-request-id': 'B2DQC6YWPK28ZBJR', 'Date': 'Fri, 11 Nov 2022 00:31:12 GMT', 'ETag': '"258893816776b2cf7be2bfe482f21dbc"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180323T000000, start_date=20221111T003110, end_date=20221111T003114 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:14.692285Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cec06faa-f141-42d3-8b2e-d62907369374"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..3c5c93de --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:08.934992Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f0fa1ca-aa2c-432f-88cc-ed2108f9994d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:08.934992+00:00, try_number=1, job_id=189, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-23 00:00:00+00:00 +INFO - Started process 1374 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-23T00:00:00+00:00', '--job-id', '189', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph1cp0k5g'] +INFO - Job 189: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003109Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003109Z +20221111/us-east-1/s3/aws4_request +0219208c3a1ec8f44a5a78b0858945e334ef9f10f77f42365f22d2bdbd0549c9 +INFO - '2022-11-11' - botocore.auth - Signature: +3945e25111d819a718dd2271e9c2a03fb986fb5c21a93acce014e83ec499b23e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'WUnw4lrP0I7Wu/odz3fD+Uk92F/msNPSoy7BOJTpYmv1w36a34IHlbobicbYsWTkmwmEwxorQ60=', 'x-amz-request-id': 'H56W8TVFH1FDG5W0', 'Date': 'Fri, 11 Nov 2022 00:31:10 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180323T000000, start_date=20221111T003108, end_date=20221111T003111 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:11.590227Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f0fa1ca-aa2c-432f-88cc-ed2108f9994d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..41d0c575 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:04.743342Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8bc578d1-699c-4b38-9c63-6b1d0ac2c0e6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:04.743342+00:00, try_number=1, job_id=187, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-23 00:00:00+00:00 +INFO - Started process 1285 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-23T00:00:00+00:00', '--job-id', '187', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm38ia27s'] +INFO - Job 187: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180323T000000, start_date=20221111T003104, end_date=20221111T003108 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:08.816390Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8bc578d1-699c-4b38-9c63-6b1d0ac2c0e6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f6954eca --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:04.770148Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42300d10-c4d1-3aa8-901d-840d453c14cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf169208-c31d-4a81-a7e7-5c9b8840eddb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:04.770148+00:00, try_number=1, job_id=188, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-23 00:00:00+00:00 +INFO - Started process 1286 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-23T00:00:00+00:00', '--job-id', '188', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjo6o_spr'] +INFO - Job 188: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180323T000000, start_date=20221111T003104, end_date=20221111T003107 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:07.772480Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf169208-c31d-4a81-a7e7-5c9b8840eddb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d1c14f9d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:31:16.072577Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f894b39e-497b-4b27-bdff-59b472524bbe"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:16.072577+00:00, try_number=1, job_id=191, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-24 00:00:00+00:00 +INFO - Started process 1294 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-24T00:00:00+00:00', '--job-id', '191', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkz3lf3t5'] +INFO - Job 191: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180324T000000, start_date=20221111T003116, end_date=20221111T003119 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:19.253187Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f894b39e-497b-4b27-bdff-59b472524bbe"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..dacfb030 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:31:16.170778Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "651a198c-7a46-4541-aa92-b3f01b899115"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:16.170778+00:00, try_number=1, job_id=192, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-24 00:00:00+00:00 +INFO - Started process 1296 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-24T00:00:00+00:00', '--job-id', '192', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwxid53wm'] +INFO - Job 192: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180324T000000, start_date=20221111T003116, end_date=20221111T003119 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:19.249320Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "651a198c-7a46-4541-aa92-b3f01b899115"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1518137d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:27.519895Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e0c3932b-3053-4993-a7c0-c01ace2dd0e4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:27.519895+00:00, try_number=1, job_id=196, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-24 00:00:00+00:00 +INFO - Started process 1448 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-24T00:00:00+00:00', '--job-id', '196', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4hbc2tkv'] +INFO - Job 196: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JYiTgWd2ss974r/kgvIdvA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:JYiTgWd2ss974r/kgvIdvA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003128Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003128Z +20221111/us-east-1/s3/aws4_request +5402a03c94152ce31e26b1175b51184d36b98492af142a0928ceba89b6f45f80 +INFO - '2022-11-11' - botocore.auth - Signature: +580be238b9052d7cf1b04af2f72ea4ad51d8364eda4b48c2f4a9ec8800568265 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'FrrRL8pV4kbEbRfLnuXJCll0XrIpiigrcyumGHEcd6b22NEDRY17DZfQ/vdIQPSLA8rLEFFJ8/I=', 'x-amz-request-id': 'THKVT0G1R35RNV6E', 'Date': 'Fri, 11 Nov 2022 00:31:28 GMT', 'ETag': '"258893816776b2cf7be2bfe482f21dbc"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180324T000000, start_date=20221111T003127, end_date=20221111T003129 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:29.378586Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e0c3932b-3053-4993-a7c0-c01ace2dd0e4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..af899c89 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:26.152080Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22a79c38-90e4-4c81-82e3-d9e920e4e885"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:26.152080+00:00, try_number=1, job_id=195, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-24 00:00:00+00:00 +INFO - Started process 1443 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-24T00:00:00+00:00', '--job-id', '195', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwpium1hs'] +INFO - Job 195: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003126Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003126Z +20221111/us-east-1/s3/aws4_request +6f283c8ad188e66acdf6bf207ebb067c10dc96a891b1092a9c7a174a661da029 +INFO - '2022-11-11' - botocore.auth - Signature: +9a87af2119eecbfc609698269ca66e2fdffe359feadac9397a452ab62df5acae +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '7X6QYN71wIpIh+SdyQE0w00PXnJq+oxdIZCVG1UM6Dzxq5Fcex0KXavjIe4CSwQOlBOR9ZA9iVk=', 'x-amz-request-id': '1109XG4M6Q9JKH9E', 'Date': 'Fri, 11 Nov 2022 00:31:27 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180324T000000, start_date=20221111T003126, end_date=20221111T003128 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:28.271026Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22a79c38-90e4-4c81-82e3-d9e920e4e885"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..59045c1b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:21.602897Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "04dbf8e4-6d4b-47c7-beac-357cb12bf87a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:21.602897+00:00, try_number=1, job_id=193, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-24 00:00:00+00:00 +INFO - Started process 1336 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-24T00:00:00+00:00', '--job-id', '193', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgncumia6'] +INFO - Job 193: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180324T000000, start_date=20221111T003121, end_date=20221111T003125 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:25.475545Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "04dbf8e4-6d4b-47c7-beac-357cb12bf87a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..4011967d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:21.637921Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7d7208c7-9581-37a2-8736-1b18dd783754"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f7548be-3409-49ce-b57b-33ddc63b6821"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:21.637921+00:00, try_number=1, job_id=194, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-24 00:00:00+00:00 +INFO - Started process 1337 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-24T00:00:00+00:00', '--job-id', '194', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_pleio8b'] +INFO - Job 194: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180324T000000, start_date=20221111T003121, end_date=20221111T003124 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:24.686002Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f7548be-3409-49ce-b57b-33ddc63b6821"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b340f77f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:31:32.022601Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aed39e94-b909-4d59-9f78-b99ffe93a257"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:32.022601+00:00, try_number=1, job_id=198, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-25 00:00:00+00:00 +INFO - Started process 1380 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-25T00:00:00+00:00', '--job-id', '198', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpeqf5noal'] +INFO - Job 198: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180325T000000, start_date=20221111T003132, end_date=20221111T003134 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:34.901233Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aed39e94-b909-4d59-9f78-b99ffe93a257"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..07076b2c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:31:32.023792Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d6f25e01-d83f-421e-b9ca-3169bc994a6d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:32.023792+00:00, try_number=1, job_id=197, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-25 00:00:00+00:00 +INFO - Started process 1381 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-25T00:00:00+00:00', '--job-id', '197', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp77ntaq48'] +INFO - Job 197: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180325T000000, start_date=20221111T003132, end_date=20221111T003134 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:34.906356Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d6f25e01-d83f-421e-b9ca-3169bc994a6d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e42be253 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:42.843453Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b82fe59-e321-44a3-9316-5c3955b27cc6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:42.843453+00:00, try_number=1, job_id=202, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-25 00:00:00+00:00 +INFO - Started process 1393 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-25T00:00:00+00:00', '--job-id', '202', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqtgpuq59'] +INFO - Job 202: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'O2XafWKvUNfl5U6thiuSQg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:O2XafWKvUNfl5U6thiuSQg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003143Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003143Z +20221111/us-east-1/s3/aws4_request +3cae311a44544c668e5e80008df808ef959df5e5b823e2b34811f6444f759e7f +INFO - '2022-11-11' - botocore.auth - Signature: +2c06666565a529b5a4b58dc24523c4c146da2ef2839a1e196332f2b12003c1a4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jfDl9RlFYhMKCLph+wQBFPAr99x7HB11hbZPF6w2Rh5TLx+pjSsoEsJ6xHGoBFIfaZz/CiIzI4k=', 'x-amz-request-id': 'RAYJW8PAG0M0HF5M', 'Date': 'Fri, 11 Nov 2022 00:31:44 GMT', 'ETag': '"3b65da7d62af50d7e5e54ead862b9242"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180325T000000, start_date=20221111T003142, end_date=20221111T003145 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:45.093783Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b82fe59-e321-44a3-9316-5c3955b27cc6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c06a2582 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:41.400535Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "08545d38-5740-46c0-bbcf-84cb9ae2c0a1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:41.400535+00:00, try_number=1, job_id=201, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-25 00:00:00+00:00 +INFO - Started process 1388 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-25T00:00:00+00:00', '--job-id', '201', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpay5q_ykm'] +INFO - Job 201: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003142Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003142Z +20221111/us-east-1/s3/aws4_request +c5b0689947d10d34a590ef3961b04dae743a23a63445b30302809213e17f608f +INFO - '2022-11-11' - botocore.auth - Signature: +41f383c22ff2555e5c1d16d70ae66cf84c20b7df72fff3b9476f4ab190ec1493 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'qXxVGi6aaDkToDB5DScJFjKee+OiSKP9OGD6+srout4uUk10uUgNRlunyDyKX8+AuPEEPOiW0aA=', 'x-amz-request-id': '7MTJJZCDMN7A4J78', 'Date': 'Fri, 11 Nov 2022 00:31:43 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180325T000000, start_date=20221111T003141, end_date=20221111T003143 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:43.891352Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "08545d38-5740-46c0-bbcf-84cb9ae2c0a1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..25eba128 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:36.395847Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f52f73d-fe45-4fc9-8bb7-f46aeda94d88"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:36.395847+00:00, try_number=1, job_id=200, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-25 00:00:00+00:00 +INFO - Started process 1460 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-25T00:00:00+00:00', '--job-id', '200', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp27873gan'] +INFO - Job 200: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180325T000000, start_date=20221111T003136, end_date=20221111T003140 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:40.289974Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f52f73d-fe45-4fc9-8bb7-f46aeda94d88"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..531cab6f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:36.370220Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c89dbb0d-fa1e-3ef8-a96c-42ca77127ef0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "709fe7cb-121a-4fbb-870d-36ef370b7044"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:36.370220+00:00, try_number=1, job_id=199, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-25 00:00:00+00:00 +INFO - Started process 1459 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-25T00:00:00+00:00', '--job-id', '199', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7hlx_qk8'] +INFO - Job 199: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180325T000000, start_date=20221111T003136, end_date=20221111T003139 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:39.495969Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "709fe7cb-121a-4fbb-870d-36ef370b7044"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..cf30e8b6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:31:47.589816Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "52ed1585-1743-4a8a-9441-745269418f90"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:47.589816+00:00, try_number=1, job_id=204, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-26 00:00:00+00:00 +INFO - Started process 1405 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-26T00:00:00+00:00', '--job-id', '204', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdq17mplw'] +INFO - Job 204: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180326T000000, start_date=20221111T003147, end_date=20221111T003150 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:50.352507Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "52ed1585-1743-4a8a-9441-745269418f90"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d58bd206 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:31:47.463815Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b80eb2d-c041-4b7f-b871-cdd0770b16da"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:47.463815+00:00, try_number=1, job_id=203, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-26 00:00:00+00:00 +INFO - Started process 1402 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-26T00:00:00+00:00', '--job-id', '203', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw17fbevp'] +INFO - Job 203: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180326T000000, start_date=20221111T003147, end_date=20221111T003150 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:50.320912Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b80eb2d-c041-4b7f-b871-cdd0770b16da"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..0cd1550c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:58.794355Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b542dcec-c557-4a40-9bf2-1a8d081218d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:58.794355+00:00, try_number=1, job_id=208, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-26 00:00:00+00:00 +INFO - Started process 1482 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-26T00:00:00+00:00', '--job-id', '208', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpks6lm9b7'] +INFO - Job 208: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'O2XafWKvUNfl5U6thiuSQg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:O2XafWKvUNfl5U6thiuSQg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003159Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003159Z +20221111/us-east-1/s3/aws4_request +078e4dad3e00d263a5e9b17c3842ce88bba54e3d1167e4e26686f109df10e10f +INFO - '2022-11-11' - botocore.auth - Signature: +1263a1f08c6b2df3dd8988607db56ab7e0a4929ab2d7ef6195cb9f7505b59ac6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'aERn4lN5ivCRlPqxwes9DwhfpMnuV9qN1q0VphcMph/0ECZmGcCX3yWLL2KrjijLZIqmYjuFkTY=', 'x-amz-request-id': '6VZDGVHK9M2VZV1W', 'Date': 'Fri, 11 Nov 2022 00:32:00 GMT', 'ETag': '"3b65da7d62af50d7e5e54ead862b9242"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180326T000000, start_date=20221111T003158, end_date=20221111T003200 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:00.672620Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b542dcec-c557-4a40-9bf2-1a8d081218d6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..660725d4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:57.284829Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "206333fd-1c18-4580-a368-e27796e12077"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:57.284829+00:00, try_number=1, job_id=207, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-26 00:00:00+00:00 +INFO - Started process 1477 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-26T00:00:00+00:00', '--job-id', '207', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1az4__3s'] +INFO - Job 207: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003158Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003158Z +20221111/us-east-1/s3/aws4_request +206616af0f8604c9b5d87af9c31bf8016bf5bdba4742e57aa8a7d4b37e05c6a8 +INFO - '2022-11-11' - botocore.auth - Signature: +5d6e343894fe2c653eb9aa9f977ddefa3b6a436659672779806494b91e24bfcc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'QPwOJoEoqiBtAB6yFtPYHA6fg0Eq7pIxjRZu9ZCLSIvUeCqiO5BA53BGIsD4gyY/sEMR+mGBWdg=', 'x-amz-request-id': 'GKANF6483612W7Z5', 'Date': 'Fri, 11 Nov 2022 00:31:58 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180326T000000, start_date=20221111T003157, end_date=20221111T003159 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:59.464470Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "206333fd-1c18-4580-a368-e27796e12077"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a501f068 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:52.452768Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9aa5526f-e0db-46b0-856e-cb8e23f5bbbc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:52.452768+00:00, try_number=1, job_id=206, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-26 00:00:00+00:00 +INFO - Started process 1535 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-26T00:00:00+00:00', '--job-id', '206', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4vnlypw3'] +INFO - Job 206: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180326T000000, start_date=20221111T003152, end_date=20221111T003157 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:57.057264Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9aa5526f-e0db-46b0-856e-cb8e23f5bbbc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..96a92a88 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:31:52.366741Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d24ca33-be4c-3301-adfe-94a31266c0f3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e64d5ed8-02a4-4f81-986e-893a849e4070"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:31:52.366741+00:00, try_number=1, job_id=205, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-26 00:00:00+00:00 +INFO - Started process 1533 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-26T00:00:00+00:00', '--job-id', '205', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1fdumht0'] +INFO - Job 205: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180326T000000, start_date=20221111T003152, end_date=20221111T003155 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:31:55.878526Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e64d5ed8-02a4-4f81-986e-893a849e4070"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f003ef9f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:02.603011Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7492213-4528-457b-997e-7fd2ce0099cf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:02.603011+00:00, try_number=1, job_id=209, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-27 00:00:00+00:00 +INFO - Started process 1492 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-27T00:00:00+00:00', '--job-id', '209', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnzta3om3'] +INFO - Job 209: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180327T000000, start_date=20221111T003202, end_date=20221111T003205 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:05.831433Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7492213-4528-457b-997e-7fd2ce0099cf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..e893ed98 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:02.609286Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "62c446bd-eebc-4e62-96ac-585255fe0de4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:02.609286+00:00, try_number=1, job_id=210, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-27 00:00:00+00:00 +INFO - Started process 1494 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-27T00:00:00+00:00', '--job-id', '210', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3dtkqa2h'] +INFO - Job 210: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180327T000000, start_date=20221111T003202, end_date=20221111T003205 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:05.824119Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "62c446bd-eebc-4e62-96ac-585255fe0de4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..37d37909 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:13.489869Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "647e3b71-a9e8-4247-8faf-6a0ecae99b9f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:13.489869+00:00, try_number=1, job_id=214, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-27 00:00:00+00:00 +INFO - Started process 1577 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-27T00:00:00+00:00', '--job-id', '214', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfqij21rv'] +INFO - Job 214: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Y4hvDNcz1kQAWRL65HX/tQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Y4hvDNcz1kQAWRL65HX/tQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003214Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003214Z +20221111/us-east-1/s3/aws4_request +88d4667f17ade5ea9ae8558f649c65a0fce5781bd73ccd51e874ac03917fe4cb +INFO - '2022-11-11' - botocore.auth - Signature: +242d2babcd4a97aa5ad307dc7911d834374c883d75d741128d41dd3ad82a694d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '1agzIkeKr46W/JXB/3XEqQTZlju6ol5Qjf89IrIt9z1N4S6Vis3nppw+1ZQaclmk8CRuhAFlIL8=', 'x-amz-request-id': '7975PW75SS5PHMF4', 'Date': 'Fri, 11 Nov 2022 00:32:15 GMT', 'ETag': '"63886f0cd733d644005912fae475ffb5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180327T000000, start_date=20221111T003213, end_date=20221111T003215 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:15.625417Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "647e3b71-a9e8-4247-8faf-6a0ecae99b9f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..65503280 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:12.587271Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73908348-b4d2-403b-be17-b2b05edcae17"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:12.587271+00:00, try_number=1, job_id=213, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-27 00:00:00+00:00 +INFO - Started process 1500 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-27T00:00:00+00:00', '--job-id', '213', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkc92_kh_'] +INFO - Job 213: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003213Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003213Z +20221111/us-east-1/s3/aws4_request +e5aa8a12d4c74e0b5871a4d9871ead574e69684819be1859f1a9e764690e7445 +INFO - '2022-11-11' - botocore.auth - Signature: +28e39e08300711a78532fa5a30c0fa6b472f3c7c42913a1c64d4d8f60207caf7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '7xP5WHHTjSauNtYCgG+fhVfgW9+p9hMl2LJ3rDXJdmaDB8iDKpIvNGtBnbRyZSqXf4yAen2+zFg=', 'x-amz-request-id': 'HFYGVJYA3HAPZN14', 'Date': 'Fri, 11 Nov 2022 00:32:14 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180327T000000, start_date=20221111T003212, end_date=20221111T003214 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:14.827492Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73908348-b4d2-403b-be17-b2b05edcae17"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6245ef34 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:07.507903Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f411d2ce-8de1-43a4-be3b-d7e12d93126d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:07.507903+00:00, try_number=1, job_id=211, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-27 00:00:00+00:00 +INFO - Started process 1545 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-27T00:00:00+00:00', '--job-id', '211', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo_5v_f9q'] +INFO - Job 211: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180327T000000, start_date=20221111T003207, end_date=20221111T003211 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:11.969386Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f411d2ce-8de1-43a4-be3b-d7e12d93126d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..9bd6f286 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:07.517335Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "178b31e0-8699-3884-8d2b-fadd56d4ef64"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "927c777b-80ed-414c-aa20-3711dc0c0842"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:07.517335+00:00, try_number=1, job_id=212, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-27 00:00:00+00:00 +INFO - Started process 1543 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-27T00:00:00+00:00', '--job-id', '212', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4bvof1ll'] +INFO - Job 212: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180327T000000, start_date=20221111T003207, end_date=20221111T003210 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:10.207458Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "927c777b-80ed-414c-aa20-3711dc0c0842"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..4297f5e6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:17.465514Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e17ce360-ea47-4fe8-99db-6e66747e4aeb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:17.465514+00:00, try_number=1, job_id=215, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-28 00:00:00+00:00 +INFO - Started process 1611 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-28T00:00:00+00:00', '--job-id', '215', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmiakydmt'] +INFO - Job 215: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180328T000000, start_date=20221111T003217, end_date=20221111T003221 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:21.346690Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e17ce360-ea47-4fe8-99db-6e66747e4aeb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a3614792 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:17.576738Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6be471a-b454-47e5-a53c-e429dcab1aa2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:17.576738+00:00, try_number=1, job_id=216, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-28 00:00:00+00:00 +INFO - Started process 1613 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-28T00:00:00+00:00', '--job-id', '216', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1i0oaraw'] +INFO - Job 216: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180328T000000, start_date=20221111T003217, end_date=20221111T003221 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:21.323308Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6be471a-b454-47e5-a53c-e429dcab1aa2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..ea255cff --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:31.775248Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "05b47313-5f33-434d-887f-a619f9a46f04"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:31.775248+00:00, try_number=1, job_id=220, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-28 00:00:00+00:00 +INFO - Started process 1640 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-28T00:00:00+00:00', '--job-id', '220', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp00kxfdxo'] +INFO - Job 220: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Y4hvDNcz1kQAWRL65HX/tQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Y4hvDNcz1kQAWRL65HX/tQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003232Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003232Z +20221111/us-east-1/s3/aws4_request +8e74fa31456ffaf92b96bb091762316aa30de0e91b1dc9949e256bd7a9e4674b +INFO - '2022-11-11' - botocore.auth - Signature: +820cb00aea145bfb06c58830de504e1692a5b323a0de4665e659be01b5bc0899 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Lif8nT7mi14z6RQ1yn/KWQcG0V0siWVVPsT0h6kC3cjp0jbwN1DlxvTM7VS5RZKlNwz8NDVEVt0=', 'x-amz-request-id': 'H6ZPCVAFT674VNAX', 'Date': 'Fri, 11 Nov 2022 00:32:33 GMT', 'ETag': '"63886f0cd733d644005912fae475ffb5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180328T000000, start_date=20221111T003231, end_date=20221111T003233 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:33.604990Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "05b47313-5f33-434d-887f-a619f9a46f04"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..7fe5328c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:29.144096Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "23d39176-98f2-4d1e-9973-8ca9091fec76"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:29.144096+00:00, try_number=1, job_id=219, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-28 00:00:00+00:00 +INFO - Started process 1633 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-28T00:00:00+00:00', '--job-id', '219', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0hyqn6ow'] +INFO - Job 219: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50051f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003230Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003230Z +20221111/us-east-1/s3/aws4_request +2f94c26d104b127681eb1eae2be8250903479c1ddb97ecf80427f02b68b32d10 +INFO - '2022-11-11' - botocore.auth - Signature: +78961ff3978e5773ed32c0ac22c2522842cb1b949b3de26d2733c729ba2c3330 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mxa1UN3jBb0kT0if747iPvAR/mlw9opjYmIV8Damess6SAv3bi+gUnXKDkh845JTOUS0sXMb7iU=', 'x-amz-request-id': 'Z3CBJBJ5G0AN65RG', 'Date': 'Fri, 11 Nov 2022 00:32:30 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180328T000000, start_date=20221111T003229, end_date=20221111T003231 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:31.363389Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "23d39176-98f2-4d1e-9973-8ca9091fec76"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..fa7b209f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:24.310185Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6b13a672-b281-4c0f-ba90-90bb6f3f3f42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:24.310185+00:00, try_number=1, job_id=218, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-28 00:00:00+00:00 +INFO - Started process 1551 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-28T00:00:00+00:00', '--job-id', '218', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplosoo0kw'] +INFO - Job 218: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180328T000000, start_date=20221111T003224, end_date=20221111T003230 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:30.545462Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6b13a672-b281-4c0f-ba90-90bb6f3f3f42"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..0343ce2a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:24.303705Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e01902ed-21ae-3271-9ed5-1852b0cd2c62"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7164eb5a-6bea-4495-8379-e11ed1e912ab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:24.303705+00:00, try_number=1, job_id=217, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-28 00:00:00+00:00 +INFO - Started process 1542 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-28T00:00:00+00:00', '--job-id', '217', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0weebr37'] +INFO - Job 217: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180328T000000, start_date=20221111T003224, end_date=20221111T003227 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:27.480448Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7164eb5a-6bea-4495-8379-e11ed1e912ab"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..38a40ee8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:35.720237Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a4e5d55-09fc-430d-972c-2f749211c93c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:35.720237+00:00, try_number=1, job_id=222, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-29 00:00:00+00:00 +INFO - Started process 1586 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-29T00:00:00+00:00', '--job-id', '222', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp35_t1j5k'] +INFO - Job 222: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180329T000000, start_date=20221111T003235, end_date=20221111T003238 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:38.504820Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a4e5d55-09fc-430d-972c-2f749211c93c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..ce5bfe23 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:35.717723Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "929cc58c-8cf6-4809-a6f0-fffde00565aa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:35.717723+00:00, try_number=1, job_id=221, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-29 00:00:00+00:00 +INFO - Started process 1583 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-29T00:00:00+00:00', '--job-id', '221', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp44hicyyl'] +INFO - Job 221: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180329T000000, start_date=20221111T003235, end_date=20221111T003238 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:38.594793Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "929cc58c-8cf6-4809-a6f0-fffde00565aa"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c2b2864e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:45.314380Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36f6b969-da68-4281-b4d8-56f804af0ea8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:45.314380+00:00, try_number=1, job_id=226, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-29 00:00:00+00:00 +INFO - Started process 1696 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-29T00:00:00+00:00', '--job-id', '226', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2vzfa36o'] +INFO - Job 226: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa3ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '4JU66o9QeprRSq1mqC+HKQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:4JU66o9QeprRSq1mqC+HKQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003246Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003246Z +20221111/us-east-1/s3/aws4_request +bf16d8690d8ec0aad46eea9c7bd7f82a0382f362a1b4ee8059297c206761b453 +INFO - '2022-11-11' - botocore.auth - Signature: +85b3ccc0bf03f87571d978fc39618c4ccf9ea08c1bd6d6a15109ec2e79b934a3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '2XXNTLWZyzaVjhUZfpPrIoIAozImwDb4krRDSaLuVmlNB4sof76+zG2h/lEF8Altnqg7XJS5H78=', 'x-amz-request-id': 'N6YJTFTW8K4BQ152', 'Date': 'Fri, 11 Nov 2022 00:32:47 GMT', 'ETag': '"e0953aea8f507a9ad14aad66a82f8729"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180329T000000, start_date=20221111T003245, end_date=20221111T003247 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:47.867539Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36f6b969-da68-4281-b4d8-56f804af0ea8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..8672f076 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:43.565943Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e54e49b0-69e5-44ce-80e9-732470705d58"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:43.565943+00:00, try_number=1, job_id=225, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-29 00:00:00+00:00 +INFO - Started process 1677 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-29T00:00:00+00:00', '--job-id', '225', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzke5ebr9'] +INFO - Job 225: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003244Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003244Z +20221111/us-east-1/s3/aws4_request +c59bf7b3a4f35478690a0e8a9ebbf23c15671aa07a9f859a6f385431d960e9bf +INFO - '2022-11-11' - botocore.auth - Signature: +594853a561da1a009f1536518d2d3c51a46e6832cdc7622bad54733f683591d4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8eQH/IPwSA0uDElZqQCnSPFr7bvv7Km3ZaGDMtIGy/80+mWVVVy4VUmmxdgHdVMhjCeIBPst04I=', 'x-amz-request-id': 'JCWRHRKFQMCKG5BK', 'Date': 'Fri, 11 Nov 2022 00:32:44 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180329T000000, start_date=20221111T003243, end_date=20221111T003245 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:45.656384Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e54e49b0-69e5-44ce-80e9-732470705d58"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..75673f89 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:39.821693Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "50628fdb-9a6c-4621-9999-40d0b7733f06"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:39.821693+00:00, try_number=1, job_id=223, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-29 00:00:00+00:00 +INFO - Started process 1649 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-29T00:00:00+00:00', '--job-id', '223', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp8dopo2y'] +INFO - Job 223: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180329T000000, start_date=20221111T003239, end_date=20221111T003243 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:43.441742Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "50628fdb-9a6c-4621-9999-40d0b7733f06"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..38c4dca1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:39.860116Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "394cf595-1bdd-39b3-877d-fe0b51e8d6b1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63ea4309-fb92-41f2-881b-ba08e28e4580"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:39.860116+00:00, try_number=1, job_id=224, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-29 00:00:00+00:00 +INFO - Started process 1651 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-29T00:00:00+00:00', '--job-id', '224', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2jw3nw_5'] +INFO - Job 224: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180329T000000, start_date=20221111T003239, end_date=20221111T003242 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:42.458540Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63ea4309-fb92-41f2-881b-ba08e28e4580"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..5c219dff --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:50.454456Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ffd9688f-f12b-42b0-8e47-27abd3e7a069"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:50.454456+00:00, try_number=1, job_id=228, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-30 00:00:00+00:00 +INFO - Started process 1596 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-30T00:00:00+00:00', '--job-id', '228', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvdh8f7uh'] +INFO - Job 228: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180330T000000, start_date=20221111T003250, end_date=20221111T003253 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:53.398097Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ffd9688f-f12b-42b0-8e47-27abd3e7a069"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2551d572 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:32:50.448509Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a7219ccc-b7e9-4028-b6aa-b0ac48fcd35d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:50.448509+00:00, try_number=1, job_id=227, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-30 00:00:00+00:00 +INFO - Started process 1595 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-30T00:00:00+00:00', '--job-id', '227', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj2q1ldzz'] +INFO - Job 227: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180330T000000, start_date=20221111T003250, end_date=20221111T003253 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:53.380647Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a7219ccc-b7e9-4028-b6aa-b0ac48fcd35d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..26db2edc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:02.881802Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "774d92b4-57ac-48db-af5b-85feb7ee28ee"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:02.881802+00:00, try_number=1, job_id=232, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-30 00:00:00+00:00 +INFO - Started process 1746 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-30T00:00:00+00:00', '--job-id', '232', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbfqesl8s'] +INFO - Job 232: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'kFNYenjcgGZgu0ODo4JhUQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:kFNYenjcgGZgu0ODo4JhUQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003303Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003303Z +20221111/us-east-1/s3/aws4_request +991b632f9975569b468a1ee10dd13201a9b4f425271da2b61258ea653b842a0f +INFO - '2022-11-11' - botocore.auth - Signature: +00d136846ab60a43d1da58e37370af0fe87c9f9df69bcc0329bf0f4e129cb482 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '5hx59OjAwv1h9BYtZufxOs2hAbOQsj7iHmWfIfnAc+WlmjUQ+QCid8eTVaBlYsbQynuB/2tyAAg=', 'x-amz-request-id': 'KMKJW9FTZXDSP3JY', 'Date': 'Fri, 11 Nov 2022 00:33:03 GMT', 'ETag': '"9053587a78dc806660bb4383a3826151"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180330T000000, start_date=20221111T003302, end_date=20221111T003304 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:04.518018Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "774d92b4-57ac-48db-af5b-85feb7ee28ee"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..33e5ddd2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:01.190918Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae45e0f6-1a94-4095-893b-462605368bd9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:01.190918+00:00, try_number=1, job_id=231, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-30 00:00:00+00:00 +INFO - Started process 1667 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-30T00:00:00+00:00', '--job-id', '231', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl02xrfke'] +INFO - Job 231: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499541f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003302Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003302Z +20221111/us-east-1/s3/aws4_request +231a69b36ad525af85fd67c8a7f77d7cd692a0970e4e620d0c8a9d93144a4c9a +INFO - '2022-11-11' - botocore.auth - Signature: +4a620430c299939d7b91d0fdd393848dac30a822658631777b0e2c78a11ac3dd +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'g+Hv+CmRSBu6vXO8z5Fnx9VIYb4yTF5y4nYWGD89xINaYKmYLdjNod/RfStzTjTX78DCl2bAyXc=', 'x-amz-request-id': 'JT45XR33MNDX9YMZ', 'Date': 'Fri, 11 Nov 2022 00:33:02 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180330T000000, start_date=20221111T003301, end_date=20221111T003303 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:03.472541Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae45e0f6-1a94-4095-893b-462605368bd9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..69ad9250 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:55.603974Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "efc74297-d899-4193-8084-fb9401f70a24"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:55.603974+00:00, try_number=1, job_id=229, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-30 00:00:00+00:00 +INFO - Started process 1736 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-30T00:00:00+00:00', '--job-id', '229', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvl__p_sd'] +INFO - Job 229: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180330T000000, start_date=20221111T003255, end_date=20221111T003301 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:01.280347Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "efc74297-d899-4193-8084-fb9401f70a24"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6ecad6c5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:32:55.687821Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "66c0a838-62db-3caf-b877-d00f8c5ce5cc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a516bbaf-abc8-4314-8b37-be1ab9ea81ca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:32:55.687821+00:00, try_number=1, job_id=230, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-30 00:00:00+00:00 +INFO - Started process 1738 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-30T00:00:00+00:00', '--job-id', '230', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnkvdcv1i'] +INFO - Job 230: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180330T000000, start_date=20221111T003255, end_date=20221111T003259 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:32:59.467188Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a516bbaf-abc8-4314-8b37-be1ab9ea81ca"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..bec268f4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:07.098571Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c4ce2fd4-453e-4aee-a284-fe070a37eb2a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-03-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:07.098571+00:00, try_number=1, job_id=234, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-31 00:00:00+00:00 +INFO - Started process 1757 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-03-31T00:00:00+00:00', '--job-id', '234', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpk_v8uidi'] +INFO - Job 234: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180331T000000, start_date=20221111T003307, end_date=20221111T003310 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:10.219518Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c4ce2fd4-453e-4aee-a284-fe070a37eb2a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..dd7bf6b3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:07.083317Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7942f416-cacc-4568-9961-0d0a696c7248"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-03-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:07.083317+00:00, try_number=1, job_id=233, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-31 00:00:00+00:00 +INFO - Started process 1755 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-03-31T00:00:00+00:00', '--job-id', '233', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd74fib4a'] +INFO - Job 233: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180331T000000, start_date=20221111T003307, end_date=20221111T003310 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:10.249411Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7942f416-cacc-4568-9961-0d0a696c7248"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c197cbff --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:17.485044Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea86d7ea-5d74-4fc3-ae96-fb12aa84a22f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-03-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:17.485044+00:00, try_number=1, job_id=238, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-31 00:00:00+00:00 +INFO - Started process 1674 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-03-31T00:00:00+00:00', '--job-id', '238', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw0mteleq'] +INFO - Job 238: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'OHIGlRH6LduLNYAJ4YXLnw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:OHIGlRH6LduLNYAJ4YXLnw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003318Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003318Z +20221111/us-east-1/s3/aws4_request +aeeaffccce8a4b6874f8831d1665ed90c7cd48d9d72a1c99292a625114745553 +INFO - '2022-11-11' - botocore.auth - Signature: +f2ea74f6cc0fc98a20d156e7cf9ba51ed6b6d834d76ee98fc4a7cebca26c5977 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'GBE+nJ2K7wCZiQ+1ubNRmxBjrGPz6CfBbbhjbtwZ0pvuZ+0DUK6tgyytZEZXw5IQns3GsjcqWCk=', 'x-amz-request-id': 'K1G89F27WHM8H7M8', 'Date': 'Fri, 11 Nov 2022 00:33:18 GMT', 'ETag': '"3872069511fa2ddb8b358009e185cb9f"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180331T000000, start_date=20221111T003317, end_date=20221111T003319 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:19.056369Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea86d7ea-5d74-4fc3-ae96-fb12aa84a22f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..884e2b4c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:16.314223Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9ee54448-7ec8-4cfb-b4a7-666a9a7d5dfe"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-03-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:16.314223+00:00, try_number=1, job_id=237, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-31 00:00:00+00:00 +INFO - Started process 1809 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-03-31T00:00:00+00:00', '--job-id', '237', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_87vjphs'] +INFO - Job 237: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003317Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003317Z +20221111/us-east-1/s3/aws4_request +1da763d353ca53f08be24d033098cb165cbc653fd3923226f13a1c230c2cc9a9 +INFO - '2022-11-11' - botocore.auth - Signature: +7571d3f587955b56fdab2d03fef02408f00ef0d86b45347b68dd489a6d01af95 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'kJuk/Y94bojkDVhrN+z7Jk/BXDhYBz05rqRBqxXhVwUbhNtiE9Hznbe4FpEF9+CLO8z2dQ0kzXA=', 'x-amz-request-id': 'DHATG69YZ0BVMBEY', 'Date': 'Fri, 11 Nov 2022 00:33:17 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180331T000000, start_date=20221111T003316, end_date=20221111T003318 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:18.576636Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9ee54448-7ec8-4cfb-b4a7-666a9a7d5dfe"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a8a53d33 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:11.641729Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "89572394-300b-4c40-9680-0865b2becc22"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-03-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:11.641729+00:00, try_number=1, job_id=235, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-31 00:00:00+00:00 +INFO - Started process 1780 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-03-31T00:00:00+00:00', '--job-id', '235', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptwnjcloh'] +INFO - Job 235: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180331T000000, start_date=20221111T003311, end_date=20221111T003315 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:15.676341Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "89572394-300b-4c40-9680-0865b2becc22"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f239305d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-03-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:11.686118Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-03-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9fb95986-7feb-3101-b9d8-65b75771d048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e2fc962-44f7-42e6-ba59-3285a76c328e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-03-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:11.686118+00:00, try_number=1, job_id=236, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-03-31 00:00:00+00:00 +INFO - Started process 1782 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-03-31T00:00:00+00:00', '--job-id', '236', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph9_nsc8_'] +INFO - Job 236: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-03-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180331T000000, start_date=20221111T003311, end_date=20221111T003314 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-03-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:14.416063Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e2fc962-44f7-42e6-ba59-3285a76c328e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..25ad99b1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:20.887284Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "43d650ef-a724-4cd2-879a-bb0cd9985561"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:20.887284+00:00, try_number=1, job_id=239, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-01 00:00:00+00:00 +INFO - Started process 1843 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-01T00:00:00+00:00', '--job-id', '239', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbzxlqfup'] +INFO - Job 239: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180401T000000, start_date=20221111T003320, end_date=20221111T003323 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:23.741427Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "43d650ef-a724-4cd2-879a-bb0cd9985561"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2986ee95 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:20.890537Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b16a01b3-4578-41a9-a313-c2917e823cd2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:20.890537+00:00, try_number=1, job_id=240, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-01 00:00:00+00:00 +INFO - Started process 1844 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-01T00:00:00+00:00', '--job-id', '240', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqycg7ugu'] +INFO - Job 240: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180401T000000, start_date=20221111T003320, end_date=20221111T003323 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:23.742891Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b16a01b3-4578-41a9-a313-c2917e823cd2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..6757ecde --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:30.511082Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0c1f37de-3948-41bf-bbc5-5fb940dc1f38"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:30.511082+00:00, try_number=1, job_id=244, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-01 00:00:00+00:00 +INFO - Started process 1750 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-01T00:00:00+00:00', '--job-id', '244', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6sc4mzjl'] +INFO - Job 244: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'OHIGlRH6LduLNYAJ4YXLnw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:OHIGlRH6LduLNYAJ4YXLnw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003331Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003331Z +20221111/us-east-1/s3/aws4_request +da4093ee5265915dfb43fffe4d447813a9c63b04d4843545bc2b3f3dfea72f19 +INFO - '2022-11-11' - botocore.auth - Signature: +c1e0d7c4495d41569fd1f39b951841e97042f8f8de799f84a591bc738cfd177f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NkpXV9qJv26b23FCCPdGXMBquknC7pVlqo1bmLDwOYZjLKMl2QgVN7RyIAOck3LXKG0hIhNZEug=', 'x-amz-request-id': 'GV6PXS5X1459KM2Z', 'Date': 'Fri, 11 Nov 2022 00:33:31 GMT', 'ETag': '"3872069511fa2ddb8b358009e185cb9f"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180401T000000, start_date=20221111T003330, end_date=20221111T003332 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:32.362877Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0c1f37de-3948-41bf-bbc5-5fb940dc1f38"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..96fa0b8b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:30.466214Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d311353-23c2-4191-a66b-eec796b05fb2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:30.466214+00:00, try_number=1, job_id=243, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-01 00:00:00+00:00 +INFO - Started process 1748 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-01T00:00:00+00:00', '--job-id', '243', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprogz2zd8'] +INFO - Job 243: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003331Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003331Z +20221111/us-east-1/s3/aws4_request +473512a14372fcbcc59bb7c043c62e2f33ff1e23a366368f837fab430aa45f04 +INFO - '2022-11-11' - botocore.auth - Signature: +1b66527ead9643b718d29ebc818117bf06c7f39639198a3ae62c63cdc5c3c2a7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '3DQWAyBdSma7v4fvXKdOEF3YNfa7i7yCRcX3xlzjKQkGIVgRP8OYJgMch38uYxEmaSrcTWh7k2c=', 'x-amz-request-id': 'GV6HBJJS48AB5FMC', 'Date': 'Fri, 11 Nov 2022 00:33:31 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180401T000000, start_date=20221111T003330, end_date=20221111T003332 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:32.205469Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d311353-23c2-4191-a66b-eec796b05fb2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..342a94ed --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:25.535688Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "400ab7f5-3d62-47b8-9b27-db032c90dac7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:25.535688+00:00, try_number=1, job_id=242, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-01 00:00:00+00:00 +INFO - Started process 1854 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-01T00:00:00+00:00', '--job-id', '242', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsllcpq4d'] +INFO - Job 242: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180401T000000, start_date=20221111T003325, end_date=20221111T003329 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:29.306210Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "400ab7f5-3d62-47b8-9b27-db032c90dac7"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..35c1d939 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:25.460716Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8b7f6b2-a2de-3a7a-b19f-46b425cb01c1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f4da8f2c-b9e2-4dbb-ba82-2efbb38a2f5f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:25.460716+00:00, try_number=1, job_id=241, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-01 00:00:00+00:00 +INFO - Started process 1852 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-01T00:00:00+00:00', '--job-id', '241', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd9h3_b93'] +INFO - Job 241: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180401T000000, start_date=20221111T003325, end_date=20221111T003329 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:29.029724Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f4da8f2c-b9e2-4dbb-ba82-2efbb38a2f5f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..fba83dd5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:34.199046Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0509f629-f97c-47af-bbf9-821e50e599a1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:34.199046+00:00, try_number=1, job_id=245, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-02 00:00:00+00:00 +INFO - Started process 1868 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-02T00:00:00+00:00', '--job-id', '245', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq89j__tv'] +INFO - Job 245: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180402T000000, start_date=20221111T003334, end_date=20221111T003336 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:36.892989Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0509f629-f97c-47af-bbf9-821e50e599a1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a1398b22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:34.205006Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17233d4b-3ae3-45e6-8497-7bff88b8d929"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:34.205006+00:00, try_number=1, job_id=246, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-02 00:00:00+00:00 +INFO - Started process 1869 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-02T00:00:00+00:00', '--job-id', '246', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmlq28ttx'] +INFO - Job 246: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180402T000000, start_date=20221111T003334, end_date=20221111T003337 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:37.268231Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17233d4b-3ae3-45e6-8497-7bff88b8d929"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..007b897e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:43.667513Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "33d0dce6-b081-4700-b21a-702ea9417464"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:43.667513+00:00, try_number=1, job_id=250, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-02 00:00:00+00:00 +INFO - Started process 1776 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-02T00:00:00+00:00', '--job-id', '250', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphwcmndh8'] +INFO - Job 250: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '4XJ+C1Nzm3hYfoyhtACZQw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:4XJ+C1Nzm3hYfoyhtACZQw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003344Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003344Z +20221111/us-east-1/s3/aws4_request +2f8af529b4e5bf5cafa0e413c9b8e176d52248b46ea37cab544389c17a5e6de5 +INFO - '2022-11-11' - botocore.auth - Signature: +5e40b49d7fbb147f7fc93a706241b3c4c69c2afec743ae27cb44a9d2afabb2e2 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Ne2yKZaMW8g866p6ZkxExnkqBKkbXw1/lcgQrRb67zZYOzfTbwtWSql6LslD5LmgKXcjPAxuP2A=', 'x-amz-request-id': 'D6YRJ9TCT8B0067M', 'Date': 'Fri, 11 Nov 2022 00:33:44 GMT', 'ETag': '"e1727e0b53739b78587e8ca1b4009943"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180402T000000, start_date=20221111T003343, end_date=20221111T003345 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:45.364565Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "33d0dce6-b081-4700-b21a-702ea9417464"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..13aad77a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:41.987915Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3add0353-7f09-485d-9ce2-f9048c315058"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:41.987915+00:00, try_number=1, job_id=249, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-02 00:00:00+00:00 +INFO - Started process 1770 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-02T00:00:00+00:00', '--job-id', '249', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe84jo8h5'] +INFO - Job 249: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003342Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003342Z +20221111/us-east-1/s3/aws4_request +e1d2a315c9e148ac1c24e9b59e01beac900628a031addb80e07a630492e80862 +INFO - '2022-11-11' - botocore.auth - Signature: +22d89ab6bf0853f4fb50d97bcc764a8159139043d80be3e85dca9bae7e857613 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'VXKVlxZXBQZUyQxTnxCro97xGtE/eegjiQakT8GZ5DYGAnBqGBsVVmFGQ1OuN4maUR/uInqh9og=', 'x-amz-request-id': '5FXT40CW4B0B8NBR', 'Date': 'Fri, 11 Nov 2022 00:33:43 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180402T000000, start_date=20221111T003341, end_date=20221111T003343 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:43.786179Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3add0353-7f09-485d-9ce2-f9048c315058"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..33abb033 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:38.367686Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e144423-499f-49cd-85ff-3e0c4d160337"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:38.367686+00:00, try_number=1, job_id=247, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-02 00:00:00+00:00 +INFO - Started process 1762 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-02T00:00:00+00:00', '--job-id', '247', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpko8zr00o'] +INFO - Job 247: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180402T000000, start_date=20221111T003338, end_date=20221111T003341 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:41.998558Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e144423-499f-49cd-85ff-3e0c4d160337"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..9b3643d6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:38.379833Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e4593a98-fea7-330e-8a7b-8e5d4ebeb185"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8f12f0eb-9dc0-4984-973f-d76b1f3e721c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:38.379833+00:00, try_number=1, job_id=248, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-02 00:00:00+00:00 +INFO - Started process 1764 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-02T00:00:00+00:00', '--job-id', '248', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpb79rxvx6'] +INFO - Job 248: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180402T000000, start_date=20221111T003338, end_date=20221111T003340 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:40.708110Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8f12f0eb-9dc0-4984-973f-d76b1f3e721c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..61c532dc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:47.636570Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed0f81c1-31fe-4fca-8058-205b9c93c449"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:47.636570+00:00, try_number=1, job_id=251, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-03 00:00:00+00:00 +INFO - Started process 1787 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-03T00:00:00+00:00', '--job-id', '251', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz1g70mmn'] +INFO - Job 251: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180403T000000, start_date=20221111T003347, end_date=20221111T003350 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:50.444054Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed0f81c1-31fe-4fca-8058-205b9c93c449"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c4cffc23 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:33:47.633982Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fec77356-a160-4e94-86bd-e28ee08be652"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:47.633982+00:00, try_number=1, job_id=252, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-03 00:00:00+00:00 +INFO - Started process 1788 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-03T00:00:00+00:00', '--job-id', '252', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1q2j1qeu'] +INFO - Job 252: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180403T000000, start_date=20221111T003347, end_date=20221111T003350 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:50.442186Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fec77356-a160-4e94-86bd-e28ee08be652"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1a999a31 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:56.811392Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "af6dea11-4328-4f29-aa39-397d47797bad"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:56.811392+00:00, try_number=1, job_id=256, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-03 00:00:00+00:00 +INFO - Started process 1949 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-03T00:00:00+00:00', '--job-id', '256', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj00qd0lh'] +INFO - Job 256: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'HDiU4YOmP09AsFV/asm+kw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:HDiU4YOmP09AsFV/asm+kw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003357Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003357Z +20221111/us-east-1/s3/aws4_request +6e5303ecd90416edd6d3ae3ba6d642131534e697b194cbf0c7d052893185ccea +INFO - '2022-11-11' - botocore.auth - Signature: +64986a6ce7b7bd06ac39ee40cdf4b20b24fa6d81a67824f35eacc585ea622095 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'QyjymD6xXf7pQHrlvaiIG0Qd71ueJeta8/Z/GJRSTj9yoz5ZcCMLUPD9tbeKns++1acD6BqejUENijYIGOQoZQ==', 'x-amz-request-id': 'V64X35JHZA23DAGQ', 'Date': 'Fri, 11 Nov 2022 00:33:58 GMT', 'ETag': '"1c3894e183a63f4f40b0557f6ac9be93"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180403T000000, start_date=20221111T003356, end_date=20221111T003358 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:58.810049Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "af6dea11-4328-4f29-aa39-397d47797bad"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f59b76d0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:56.737041Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "09fa7696-7f9d-4aa6-bfac-fc9b74b6ee6e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:56.737041+00:00, try_number=1, job_id=255, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-03 00:00:00+00:00 +INFO - Started process 1947 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-03T00:00:00+00:00', '--job-id', '255', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm_hctusk'] +INFO - Job 255: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003357Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003357Z +20221111/us-east-1/s3/aws4_request +4f5b891010104c5216d9010da2a925c292dd0fcc1636c22f77b9de48e16a478d +INFO - '2022-11-11' - botocore.auth - Signature: +2840a53ed9384e04da84080100577c78579f741a0d347c1977cb223938e0fb24 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'qKJIzRNxT5Uk+qAzYNTFyy4082lD4765RJOSx5vT5W8MYFeZ7VYbggDgkOxOt5JOizPc/+bnOxaR4lLj/K1zKg==', 'x-amz-request-id': 'V64VKQRDM1V8B4BB', 'Date': 'Fri, 11 Nov 2022 00:33:58 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180403T000000, start_date=20221111T003356, end_date=20221111T003358 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:58.696121Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "09fa7696-7f9d-4aa6-bfac-fc9b74b6ee6e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..f9b168f8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:52.436660Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee66996d-5d08-401f-83e1-396251ab701e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:52.436660+00:00, try_number=1, job_id=253, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-03 00:00:00+00:00 +INFO - Started process 1938 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-03T00:00:00+00:00', '--job-id', '253', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmper4ce705'] +INFO - Job 253: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180403T000000, start_date=20221111T003352, end_date=20221111T003355 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:55.583976Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee66996d-5d08-401f-83e1-396251ab701e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..fbcf5ad6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:33:52.456319Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f06e30c7-7e08-31e1-b8b1-e6ad09713acc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fdb76db5-5bba-4a58-b48f-32d0c2b03cea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:33:52.456319+00:00, try_number=1, job_id=254, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-03 00:00:00+00:00 +INFO - Started process 1939 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-03T00:00:00+00:00', '--job-id', '254', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgeg_a6fp'] +INFO - Job 254: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180403T000000, start_date=20221111T003352, end_date=20221111T003355 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:33:55.271696Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fdb76db5-5bba-4a58-b48f-32d0c2b03cea"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..18ae9372 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:01.047476Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "303d1005-4c55-4c0e-9834-d09718c38d68"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:01.047476+00:00, try_number=1, job_id=258, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-04 00:00:00+00:00 +INFO - Started process 1862 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-04T00:00:00+00:00', '--job-id', '258', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4rr86bs9'] +INFO - Job 258: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180404T000000, start_date=20221111T003401, end_date=20221111T003405 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:05.092559Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "303d1005-4c55-4c0e-9834-d09718c38d68"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..fcbd4f7f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:01.045605Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae2eb868-ddc4-4703-a6f1-5edb08c51c1b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:01.045605+00:00, try_number=1, job_id=257, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-04 00:00:00+00:00 +INFO - Started process 1863 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-04T00:00:00+00:00', '--job-id', '257', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1hs4_o73'] +INFO - Job 257: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180404T000000, start_date=20221111T003401, end_date=20221111T003403 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:03.835644Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae2eb868-ddc4-4703-a6f1-5edb08c51c1b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d4edfc20 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:11.363371Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "24aa3fa0-19d0-40b6-9e5e-46fca9343e09"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:11.363371+00:00, try_number=1, job_id=262, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-04 00:00:00+00:00 +INFO - Started process 1886 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-04T00:00:00+00:00', '--job-id', '262', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsi6rqg6b'] +INFO - Job 262: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '60KInPEPLlL8zZqxxQ1ijw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:60KInPEPLlL8zZqxxQ1ijw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003411Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003411Z +20221111/us-east-1/s3/aws4_request +a640acdbd83c7099c6eda9567df19592539824c0bb5a427a2c01945840855261 +INFO - '2022-11-11' - botocore.auth - Signature: +c8dd688e2331cbff0344cdfd65ce51f0cbfcd7f38d2c8454d3209348925e19ee +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'EmRdVV6fLhTo2b9OZptt+IeL+M1+W0ZevLmBo63MRCVfzNRnW8rDKA97N8QKuK99GF/RutWa3gs=', 'x-amz-request-id': 'EWG7WAARW1H1K3RQ', 'Date': 'Fri, 11 Nov 2022 00:34:13 GMT', 'ETag': '"eb42889cf10f2e52fccd9ab1c50d628f"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180404T000000, start_date=20221111T003411, end_date=20221111T003414 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:14.101773Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "24aa3fa0-19d0-40b6-9e5e-46fca9343e09"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..68c6f743 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:09.147630Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e113709-a978-4250-b3e3-5e38c7419489"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:09.147630+00:00, try_number=1, job_id=261, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-04 00:00:00+00:00 +INFO - Started process 1878 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-04T00:00:00+00:00', '--job-id', '261', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_uz_omoy'] +INFO - Job 261: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003409Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003409Z +20221111/us-east-1/s3/aws4_request +a33afb226343c573d40d4a2525235c123be77324ac9f0548f0ad9b71649005f1 +INFO - '2022-11-11' - botocore.auth - Signature: +9ad3975fd21d7ca895ac7145c48e1b12d58896c5973c6206b3dd4dc50f11ee7f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'yuArIQpg2vKdTFxXwpWly1ohaDiQOCl2Bj3cl5JNtNr4BryckncfmxA4lB+qzD9rKsc3LiubcPs=', 'x-amz-request-id': 'JEF4AQP0KX7YM07A', 'Date': 'Fri, 11 Nov 2022 00:34:10 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180404T000000, start_date=20221111T003409, end_date=20221111T003411 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:11.141206Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e113709-a978-4250-b3e3-5e38c7419489"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d7798722 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:06.611751Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fec6c2a3-1b6e-470e-bce9-182e221a58b9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:06.611751+00:00, try_number=1, job_id=260, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-04 00:00:00+00:00 +INFO - Started process 1873 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-04T00:00:00+00:00', '--job-id', '260', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfa5xjzk4'] +INFO - Job 260: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180404T000000, start_date=20221111T003406, end_date=20221111T003410 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:10.301208Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fec6c2a3-1b6e-470e-bce9-182e221a58b9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3ad25dde --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:05.173654Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b4bf562-61cd-3035-aa50-eb54f87a5cb3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "219c87d2-5347-41ac-9787-2c2258daafde"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:05.173654+00:00, try_number=1, job_id=259, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-04 00:00:00+00:00 +INFO - Started process 1869 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-04T00:00:00+00:00', '--job-id', '259', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz183352b'] +INFO - Job 259: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180404T000000, start_date=20221111T003405, end_date=20221111T003407 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:07.468612Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "219c87d2-5347-41ac-9787-2c2258daafde"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..dfd052e9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:15.450692Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "86a365c9-c172-454b-bcda-257615fe8a8f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:15.450692+00:00, try_number=1, job_id=263, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-05 00:00:00+00:00 +INFO - Started process 1988 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-05T00:00:00+00:00', '--job-id', '263', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpaoxr3zmx'] +INFO - Job 263: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180405T000000, start_date=20221111T003415, end_date=20221111T003418 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:18.278885Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "86a365c9-c172-454b-bcda-257615fe8a8f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..4b874197 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:15.451829Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b227716-f5ac-460b-9f4f-d5a834b95d53"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:15.451829+00:00, try_number=1, job_id=264, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-05 00:00:00+00:00 +INFO - Started process 1986 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-05T00:00:00+00:00', '--job-id', '264', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptaowyqqv'] +INFO - Job 264: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180405T000000, start_date=20221111T003415, end_date=20221111T003418 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:18.311016Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b227716-f5ac-460b-9f4f-d5a834b95d53"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bf24aae0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:25.631271Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bfab4df3-3eb8-48f0-ac17-48e2f9c14a6e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:25.631271+00:00, try_number=1, job_id=268, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-05 00:00:00+00:00 +INFO - Started process 1909 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-05T00:00:00+00:00', '--job-id', '268', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3m0w41tb'] +INFO - Job 268: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eeca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'CyOr6niZey6qwif5Mc0xEA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:CyOr6niZey6qwif5Mc0xEA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003426Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003426Z +20221111/us-east-1/s3/aws4_request +ded5640c6ad11e1c57562dd4df5b228d609b8f60ffa751b35b83c8cefe5ea40a +INFO - '2022-11-11' - botocore.auth - Signature: +250a10f45b856a3ba580bdeae790e3b5db8f415acda794c08ce67f25c2295218 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'SDFpF+syaOpzNi1XZH2uL/oDq7vDm7jSe5j46bNT9RD3j9yFpzt39WF4SsbpUTm7J1IP4qN41Vg=', 'x-amz-request-id': '6BG2VJZ5ZQZRVKRY', 'Date': 'Fri, 11 Nov 2022 00:34:27 GMT', 'ETag': '"0b23abea78997b2eaac227f931cd3110"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180405T000000, start_date=20221111T003425, end_date=20221111T003427 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:27.848857Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bfab4df3-3eb8-48f0-ac17-48e2f9c14a6e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..8d37f497 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:24.240003Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c726d0c2-935b-41dd-aa3a-737f786ebfb4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:24.240003+00:00, try_number=1, job_id=267, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-05 00:00:00+00:00 +INFO - Started process 1903 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-05T00:00:00+00:00', '--job-id', '267', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp93nxlkg3'] +INFO - Job 267: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ee940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003424Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003424Z +20221111/us-east-1/s3/aws4_request +9f468ecb1ec8297bdff2182c76acc98d2a45ba12669b2517f2f480c2a316a867 +INFO - '2022-11-11' - botocore.auth - Signature: +73d376b3dcf66af6dd045fbb5d7dc7eb933c16abd839b9b294b739cbda81bfba +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6C7Zriq8v11UmqdZhyOfNnjR0kajuhoyZm7jBuZRF+IvKTN4BkygpYBXFH4Py/+7E2aEn0eJ+jo=', 'x-amz-request-id': '4R0E3YVMXX6FG09V', 'Date': 'Fri, 11 Nov 2022 00:34:25 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180405T000000, start_date=20221111T003424, end_date=20221111T003426 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:26.296798Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c726d0c2-935b-41dd-aa3a-737f786ebfb4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..878c5247 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:20.090303Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4ee34e8b-8203-4d75-a9ee-48015c435d6e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:20.090303+00:00, try_number=1, job_id=265, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-05 00:00:00+00:00 +INFO - Started process 1897 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-05T00:00:00+00:00', '--job-id', '265', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9g_j0mox'] +INFO - Job 265: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180405T000000, start_date=20221111T003420, end_date=20221111T003423 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:23.639514Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4ee34e8b-8203-4d75-a9ee-48015c435d6e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..167a22ef --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:20.081519Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3beaa00-1c7d-3def-8804-811965fd3aa9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb1f0c5c-9fc3-4d4f-a722-451917c2bdb8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:20.081519+00:00, try_number=1, job_id=266, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-05 00:00:00+00:00 +INFO - Started process 1895 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-05T00:00:00+00:00', '--job-id', '266', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1cxviyiz'] +INFO - Job 266: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180405T000000, start_date=20221111T003420, end_date=20221111T003422 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:22.770325Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb1f0c5c-9fc3-4d4f-a722-451917c2bdb8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6547fcfb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:29.449836Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "34c81234-3a8d-49be-868d-8f4d41b6ad32"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:29.449836+00:00, try_number=1, job_id=269, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-06 00:00:00+00:00 +INFO - Started process 1967 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-06T00:00:00+00:00', '--job-id', '269', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbi35g9m5'] +INFO - Job 269: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180406T000000, start_date=20221111T003429, end_date=20221111T003432 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:32.874999Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "34c81234-3a8d-49be-868d-8f4d41b6ad32"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..e84346b7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:29.584930Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b141985-f710-4f73-a75c-5fcf30f9397d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:29.584930+00:00, try_number=1, job_id=270, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-06 00:00:00+00:00 +INFO - Started process 1977 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-06T00:00:00+00:00', '--job-id', '270', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6bk9zspc'] +INFO - Job 270: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180406T000000, start_date=20221111T003429, end_date=20221111T003432 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:32.869522Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b141985-f710-4f73-a75c-5fcf30f9397d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..53b7f248 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:39.388260Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f27b46a3-1bb2-449c-a8a2-f0dbaedd0369"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:39.388260+00:00, try_number=1, job_id=274, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-06 00:00:00+00:00 +INFO - Started process 2043 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-06T00:00:00+00:00', '--job-id', '274', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt0sowmyd'] +INFO - Job 274: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'HDiU4YOmP09AsFV/asm+kw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:HDiU4YOmP09AsFV/asm+kw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003440Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003440Z +20221111/us-east-1/s3/aws4_request +e4897cb0ac54be550d95ec27be3841f4daaba4fb06058f31827d4f5fb102e9e0 +INFO - '2022-11-11' - botocore.auth - Signature: +e42d3f5dc8961e9471c4469a5b54315549d8fb84e480ef4d25ddf1e339233bc0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'HbWPQcIdi9a5otkrXailaofxPpR6rab1ragzUDjLM3L6yLKQcWKhPS4B6ty69j6Cc9D1XzoLVuA=', 'x-amz-request-id': 'QZKV8GVQY883J2QK', 'Date': 'Fri, 11 Nov 2022 00:34:40 GMT', 'ETag': '"1c3894e183a63f4f40b0557f6ac9be93"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180406T000000, start_date=20221111T003439, end_date=20221111T003441 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:41.556887Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f27b46a3-1bb2-449c-a8a2-f0dbaedd0369"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c3b2ab12 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:39.354162Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d84cac9-262b-4946-a2c9-8276f43743df"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:39.354162+00:00, try_number=1, job_id=273, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-06 00:00:00+00:00 +INFO - Started process 2042 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-06T00:00:00+00:00', '--job-id', '273', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf4o13ylx'] +INFO - Job 273: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003440Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003440Z +20221111/us-east-1/s3/aws4_request +f710665ca830725c539c195951c12e1e593c57d89aa632f5cd13858648e6332e +INFO - '2022-11-11' - botocore.auth - Signature: +0ff38e63dde84b84a252036b089f0cb52a96cbc5ac4cbff54901f647565ba6ad +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'g1UCxi7yBH6zM9s72ngINgMoabvxh8jBERwL9Dg5m/Wj0YL8MZwzrx7W+BG+PXyjiQ+8382tuuc=', 'x-amz-request-id': 'QZKY8JPY69C1F3J9', 'Date': 'Fri, 11 Nov 2022 00:34:40 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180406T000000, start_date=20221111T003439, end_date=20221111T003441 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:41.567068Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d84cac9-262b-4946-a2c9-8276f43743df"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ac872dc2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:34.339795Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58d97661-12a3-4b66-8bd5-bf036052be85"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:34.339795+00:00, try_number=1, job_id=271, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-06 00:00:00+00:00 +INFO - Started process 1994 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-06T00:00:00+00:00', '--job-id', '271', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpszunj4r4'] +INFO - Job 271: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180406T000000, start_date=20221111T003434, end_date=20221111T003437 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:37.624046Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58d97661-12a3-4b66-8bd5-bf036052be85"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..cb3c91f4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:34.437851Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42be6796-b64f-3a64-9cac-e85e3317c8d9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ddbbf6ac-5036-41e0-a666-24af9ed9a284"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:34.437851+00:00, try_number=1, job_id=272, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-06 00:00:00+00:00 +INFO - Started process 1996 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-06T00:00:00+00:00', '--job-id', '272', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa1fcgy7f'] +INFO - Job 272: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180406T000000, start_date=20221111T003434, end_date=20221111T003437 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:37.496011Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ddbbf6ac-5036-41e0-a666-24af9ed9a284"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..971a0d91 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:43.028603Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e3b1feaf-1178-496e-8482-72f8619addac"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:43.028603+00:00, try_number=1, job_id=275, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-07 00:00:00+00:00 +INFO - Started process 2004 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-07T00:00:00+00:00', '--job-id', '275', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2wncc5gu'] +INFO - Job 275: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180407T000000, start_date=20221111T003443, end_date=20221111T003446 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:46.003450Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e3b1feaf-1178-496e-8482-72f8619addac"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..e10eae0d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:43.028845Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "476becfe-305f-43e4-9560-c0ab7747a5fc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:43.028845+00:00, try_number=1, job_id=276, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-07 00:00:00+00:00 +INFO - Started process 2006 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-07T00:00:00+00:00', '--job-id', '276', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvsib7gxw'] +INFO - Job 276: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180407T000000, start_date=20221111T003443, end_date=20221111T003446 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:46.003342Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "476becfe-305f-43e4-9560-c0ab7747a5fc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5d151190 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:52.905586Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed83d309-ad5f-4d62-bd2d-206d73a542fa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:52.905586+00:00, try_number=1, job_id=280, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-07 00:00:00+00:00 +INFO - Started process 2018 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-07T00:00:00+00:00', '--job-id', '280', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9ffcriul'] +INFO - Job 280: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'yEVztx+tEjBU43P7raxBHg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:yEVztx+tEjBU43P7raxBHg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003453Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003453Z +20221111/us-east-1/s3/aws4_request +ed648a31565d994c84a43919b486e81bb3f7e59ce49fa97f1c32c11d5ba7cf6f +INFO - '2022-11-11' - botocore.auth - Signature: +d6edf4880049ea1131ac6b9d62e7e1b880d35b28b7f5e13157e9d8cd63aa0997 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'pehaeiINfnG3W7BqEiwGnGTy0OoeszAnBgLQeVFJD/TYA9h7ElP+6psYDtnSt2keOhqGvxz+lpk=', 'x-amz-request-id': '2D3ZT4NV5SNM6CNB', 'Date': 'Fri, 11 Nov 2022 00:34:54 GMT', 'ETag': '"c84573b71fad123054e373fbadac411e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180407T000000, start_date=20221111T003452, end_date=20221111T003455 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:55.212190Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed83d309-ad5f-4d62-bd2d-206d73a542fa"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b946d371 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:51.145778Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "34c72666-8021-408c-b577-e16144b64383"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:51.145778+00:00, try_number=1, job_id=279, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-07 00:00:00+00:00 +INFO - Started process 2013 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-07T00:00:00+00:00', '--job-id', '279', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6c4fb1bf'] +INFO - Job 279: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499553a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003452Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003452Z +20221111/us-east-1/s3/aws4_request +75d20cdd12cba1381092b42ac420e069f1cd97bdb40373a85c9b97301b40831a +INFO - '2022-11-11' - botocore.auth - Signature: +f66b35d19f3067fa72dd57fa0dfff7709f50b6b5d07c38453d2fea8bc40fe0fd +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'MdcSwAON9gZY3KVAF8sPg3x4wvyOb1B40h9z1qTRsHY9FTBx3IDO58XFDh4udh/HSSMZeA1pVRc=', 'x-amz-request-id': 'M71JGXKCQAQWGN32', 'Date': 'Fri, 11 Nov 2022 00:34:52 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180407T000000, start_date=20221111T003451, end_date=20221111T003453 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:53.551430Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "34c72666-8021-408c-b577-e16144b64383"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..3d87617c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:47.206919Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6d66173c-3b3c-45de-ac44-bf7f576a7823"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:47.206919+00:00, try_number=1, job_id=278, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-07 00:00:00+00:00 +INFO - Started process 2077 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-07T00:00:00+00:00', '--job-id', '278', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp39x38d0u'] +INFO - Job 278: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180407T000000, start_date=20221111T003447, end_date=20221111T003451 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:51.106236Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6d66173c-3b3c-45de-ac44-bf7f576a7823"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e40b17bc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:34:47.180813Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8c543036-e62e-387d-9628-ac990f3581d7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c2b3b4ab-720d-4a72-a161-4e8a92c272bb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:47.180813+00:00, try_number=1, job_id=277, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-07 00:00:00+00:00 +INFO - Started process 2075 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-07T00:00:00+00:00', '--job-id', '277', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7qgkwwy_'] +INFO - Job 277: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180407T000000, start_date=20221111T003447, end_date=20221111T003449 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:34:49.697565Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c2b3b4ab-720d-4a72-a161-4e8a92c272bb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0298f03a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:57.138166Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8acf318a-afde-4272-8d6b-49905bbdc937"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:57.138166+00:00, try_number=1, job_id=281, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-08 00:00:00+00:00 +INFO - Started process 2027 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-08T00:00:00+00:00', '--job-id', '281', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbm9nppvx'] +INFO - Job 281: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180408T000000, start_date=20221111T003457, end_date=20221111T003500 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:00.630204Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8acf318a-afde-4272-8d6b-49905bbdc937"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..81355749 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:34:57.598778Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "28e39138-3185-4277-9b33-4582e753d1f2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:34:57.598778+00:00, try_number=1, job_id=282, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-08 00:00:00+00:00 +INFO - Started process 2036 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-08T00:00:00+00:00', '--job-id', '282', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7rtivsmk'] +INFO - Job 282: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180408T000000, start_date=20221111T003457, end_date=20221111T003501 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:01.362545Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "28e39138-3185-4277-9b33-4582e753d1f2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c838c100 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:13.495941Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5820d993-bd83-45d6-b825-7f9320fd8f36"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:13.495941+00:00, try_number=1, job_id=286, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-08 00:00:00+00:00 +INFO - Started process 2113 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-08T00:00:00+00:00', '--job-id', '286', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz2uvfz7s'] +INFO - Job 286: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'yEVztx+tEjBU43P7raxBHg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:yEVztx+tEjBU43P7raxBHg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003514Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003514Z +20221111/us-east-1/s3/aws4_request +1a7c7f662cbdd2da3d95579462282c66a34e517b108fa178ec516378158f862f +INFO - '2022-11-11' - botocore.auth - Signature: +d5ae99d606bbdbba9b36fe1e490796417c3be3c8c57af02a999415486df4ebf1 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'bqAejoh2KENFv8JtRGtiAJn+/tSzfgpBrqPoIgnJ97c5yUcfnpzq3/FZQJrpdhX1SEAqBMKkLmQ=', 'x-amz-request-id': '7P0F1BH1ESEHH9DH', 'Date': 'Fri, 11 Nov 2022 00:35:15 GMT', 'ETag': '"c84573b71fad123054e373fbadac411e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180408T000000, start_date=20221111T003513, end_date=20221111T003516 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:16.177858Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5820d993-bd83-45d6-b825-7f9320fd8f36"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..053fdfb1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:08.899495Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "846eb1b0-c033-4b75-a44d-7a4f326371ea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:08.899495+00:00, try_number=1, job_id=285, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-08 00:00:00+00:00 +INFO - Started process 2106 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-08T00:00:00+00:00', '--job-id', '285', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmkl2m0bx'] +INFO - Job 285: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003510Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003510Z +20221111/us-east-1/s3/aws4_request +3280c4e3be6f1ce4ad81f876abb6f55091355df0003bcd3f5f8e2046bfc5650a +INFO - '2022-11-11' - botocore.auth - Signature: +f1e7d4d659bcf24888693a239f3285855abcbd8ae78590580709d2b2c31a9d75 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'TxxsGUcmWUtraY44pyyaqE1nR5iBK7VhqnhXbVn3ZXfExknFWB6TzyE5vy2apAGr5LL1xkBCNtk=', 'x-amz-request-id': 'STKNAPKVS94282DE', 'Date': 'Fri, 11 Nov 2022 00:35:10 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180408T000000, start_date=20221111T003508, end_date=20221111T003511 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:11.769006Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "846eb1b0-c033-4b75-a44d-7a4f326371ea"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..2f4c5d07 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:03.538177Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "542bebf2-345a-4138-80c3-a9ab985477e7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:03.538177+00:00, try_number=1, job_id=284, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-08 00:00:00+00:00 +INFO - Started process 2108 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-08T00:00:00+00:00', '--job-id', '284', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp9r9necw'] +INFO - Job 284: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180408T000000, start_date=20221111T003503, end_date=20221111T003511 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:11.518245Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "542bebf2-345a-4138-80c3-a9ab985477e7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..901831af --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:03.407585Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0de47ec6-fd4b-30de-a10b-c3bf4ff5dade"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "579de2df-0ae9-4a63-9f76-f8d4d9558bdb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:03.407585+00:00, try_number=1, job_id=283, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-08 00:00:00+00:00 +INFO - Started process 2101 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-08T00:00:00+00:00', '--job-id', '283', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppxf0wjj9'] +INFO - Job 283: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180408T000000, start_date=20221111T003503, end_date=20221111T003507 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:07.156121Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "579de2df-0ae9-4a63-9f76-f8d4d9558bdb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7d016662 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:35:19.476606Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e2f6fccb-f69b-4deb-97d8-f34d684e7a46"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:19.476606+00:00, try_number=1, job_id=287, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-09 00:00:00+00:00 +INFO - Started process 2121 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-09T00:00:00+00:00', '--job-id', '287', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt7c7ubc4'] +INFO - Job 287: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180409T000000, start_date=20221111T003519, end_date=20221111T003523 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:23.201972Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e2f6fccb-f69b-4deb-97d8-f34d684e7a46"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7c63823c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:35:19.831414Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "02507224-fea4-4890-8ecb-efcc8bb26031"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:19.831414+00:00, try_number=1, job_id=288, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-09 00:00:00+00:00 +INFO - Started process 2124 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-09T00:00:00+00:00', '--job-id', '288', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7fqj7ifo'] +INFO - Job 288: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180409T000000, start_date=20221111T003519, end_date=20221111T003523 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:23.188941Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "02507224-fea4-4890-8ecb-efcc8bb26031"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..6a8f68b5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:32.065826Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fcde6a10-4b4c-44c1-be73-b0dc6859781d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:32.065826+00:00, try_number=1, job_id=292, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-09 00:00:00+00:00 +INFO - Started process 2206 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-09T00:00:00+00:00', '--job-id', '292', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyia7h912'] +INFO - Job 292: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003532Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003532Z +20221111/us-east-1/s3/aws4_request +8aa2600e3a561eb8dc6c36a6ec753da52441db1180496a7cd20eb591d14f4acd +INFO - '2022-11-11' - botocore.auth - Signature: +dbceb98ee7dd9831ec11bd42b1550627d21dc7a5137b7f010d76c02f621a9ea9 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'XPIP8gZsPkllRbrilnoMQ89U5HUtaG8Ee23hr71dZcr8dux8/Iw+CBqXH5RdhgO7zbSy9A5yJ+o=', 'x-amz-request-id': 'DJ54N6G8VVVV72H3', 'Date': 'Fri, 11 Nov 2022 00:35:33 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180409T000000, start_date=20221111T003532, end_date=20221111T003534 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:34.009211Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fcde6a10-4b4c-44c1-be73-b0dc6859781d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..8ef5c695 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:29.978356Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0bf9e424-50a6-4a0e-a65b-d14ee02b40b1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:29.978356+00:00, try_number=1, job_id=291, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-09 00:00:00+00:00 +INFO - Started process 2168 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-09T00:00:00+00:00', '--job-id', '291', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfntxhity'] +INFO - Job 291: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003530Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003530Z +20221111/us-east-1/s3/aws4_request +5a4e1956d696f8166c991251c84e59ea206f43b6751d436a2d0744cb4d4e7ee0 +INFO - '2022-11-11' - botocore.auth - Signature: +57075c9be7cf66cd41827138a29a6e470d33824db0ab661aab3bc320dd087187 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'EFiLsD/+86qKgXCTLCCFUpRGL5oLZAg2QdSK1MxxHV+qN9fAOtdHnkqcHFFK/0LSlisVqJiVnho=', 'x-amz-request-id': 'R7XPWDAM3RSPQBS8', 'Date': 'Fri, 11 Nov 2022 00:35:31 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180409T000000, start_date=20221111T003529, end_date=20221111T003532 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:32.374327Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0bf9e424-50a6-4a0e-a65b-d14ee02b40b1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..72055cef --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:25.046303Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dc3b755f-9e8c-418e-9ddf-d454105be02a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:25.046303+00:00, try_number=1, job_id=290, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-09 00:00:00+00:00 +INFO - Started process 2134 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-09T00:00:00+00:00', '--job-id', '290', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqrdswm2h'] +INFO - Job 290: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180409T000000, start_date=20221111T003525, end_date=20221111T003529 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:29.604651Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dc3b755f-9e8c-418e-9ddf-d454105be02a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e5bee9e8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:24.945713Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "afc738bf-02b1-3d20-bc28-bd8ca31e6d97"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6ec0031-d35a-4bfd-8a90-d894041a28a0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:24.945713+00:00, try_number=1, job_id=289, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-09 00:00:00+00:00 +INFO - Started process 2132 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-09T00:00:00+00:00', '--job-id', '289', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplhyjw1qy'] +INFO - Job 289: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180409T000000, start_date=20221111T003524, end_date=20221111T003528 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:28.314225Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6ec0031-d35a-4bfd-8a90-d894041a28a0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..047df496 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:35:35.651311Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d075d05-8273-45b1-8856-faeda7257f5c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:35.651311+00:00, try_number=1, job_id=294, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-10 00:00:00+00:00 +INFO - Started process 2223 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-10T00:00:00+00:00', '--job-id', '294', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7an67n7j'] +INFO - Job 294: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180410T000000, start_date=20221111T003535, end_date=20221111T003539 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:39.194229Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d075d05-8273-45b1-8856-faeda7257f5c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..0d297284 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:35:35.617643Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99b74815-c7b6-4925-bc9c-a74374c15cd1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:35.617643+00:00, try_number=1, job_id=293, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-10 00:00:00+00:00 +INFO - Started process 2222 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-10T00:00:00+00:00', '--job-id', '293', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9l5cc_09'] +INFO - Job 293: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180410T000000, start_date=20221111T003535, end_date=20221111T003539 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:39.179557Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99b74815-c7b6-4925-bc9c-a74374c15cd1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d0d87321 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:45.339378Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "09f96d30-89dc-4d5c-8613-2803e21dc2ab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:45.339378+00:00, try_number=1, job_id=298, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-10 00:00:00+00:00 +INFO - Started process 2233 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-10T00:00:00+00:00', '--job-id', '298', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph0xb217z'] +INFO - Job 298: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003546Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003546Z +20221111/us-east-1/s3/aws4_request +f5829532271d9d9ad10e7c118030b57348558671082ca442c0523738d641adf6 +INFO - '2022-11-11' - botocore.auth - Signature: +3931d5cd42c12480fa3c63209f6de0f4765d0c837b5dbbdb7798b1afd2ca0448 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mUkYF1MO+E8lwrwYAobv++QZUnb8+6iXRuhodAKFt6phOAxDua6n811FxGJasrOp4g2acAoYz0s=', 'x-amz-request-id': 'PH9T69J1ZZF8T3VM', 'Date': 'Fri, 11 Nov 2022 00:35:46 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180410T000000, start_date=20221111T003545, end_date=20221111T003547 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:47.514835Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "09f96d30-89dc-4d5c-8613-2803e21dc2ab"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..278b0319 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:45.227784Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7dc2d216-2d26-415a-8db4-784f9ea2a674"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:45.227784+00:00, try_number=1, job_id=297, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-10 00:00:00+00:00 +INFO - Started process 2230 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-10T00:00:00+00:00', '--job-id', '297', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx7soec8b'] +INFO - Job 297: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003545Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003545Z +20221111/us-east-1/s3/aws4_request +470d44c28a2a143b544c160d7bc5784ba7937d7a894036e5f68ab376c8d63b9b +INFO - '2022-11-11' - botocore.auth - Signature: +c005f30ae92dff6e67d6f68148e1a71544a350bb0a21702db3e4c95324bb8785 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'cA5qSx+BUk4SLONbvgAg/ZqOezPP1Uc8/auEPnEaLKC87pKdhu+5INTBCl3f/EhGnUaoKpxG9yQ=', 'x-amz-request-id': 'PH9WZZ95J1ZAMPTE', 'Date': 'Fri, 11 Nov 2022 00:35:46 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180410T000000, start_date=20221111T003545, end_date=20221111T003547 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:47.222336Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7dc2d216-2d26-415a-8db4-784f9ea2a674"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e3c850c0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:40.580421Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c3c6ae44-6c39-4724-a190-a99a761d05d4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:40.580421+00:00, try_number=1, job_id=295, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-10 00:00:00+00:00 +INFO - Started process 2200 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-10T00:00:00+00:00', '--job-id', '295', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjzr5z4mz'] +INFO - Job 295: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180410T000000, start_date=20221111T003540, end_date=20221111T003543 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:43.959692Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c3c6ae44-6c39-4724-a190-a99a761d05d4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..7d9829ae --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:40.590093Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "966e448a-08b1-3a67-bae1-e0806dbf735c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b7a57fe0-a1bf-467a-93cc-57709a9668b4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:40.590093+00:00, try_number=1, job_id=296, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-10 00:00:00+00:00 +INFO - Started process 2202 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-10T00:00:00+00:00', '--job-id', '296', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd5jwka0o'] +INFO - Job 296: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180410T000000, start_date=20221111T003540, end_date=20221111T003543 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:43.578517Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b7a57fe0-a1bf-467a-93cc-57709a9668b4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f0c9406b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:35:49.090101Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f2bf39d6-1ebb-4d40-b5cb-0094961bf186"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:49.090101+00:00, try_number=1, job_id=299, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-11 00:00:00+00:00 +INFO - Started process 2231 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-11T00:00:00+00:00', '--job-id', '299', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnf17cpfm'] +INFO - Job 299: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180411T000000, start_date=20221111T003549, end_date=20221111T003552 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:52.285237Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f2bf39d6-1ebb-4d40-b5cb-0094961bf186"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c7412136 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:35:49.099951Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a459e248-bd66-4d47-ae57-a585086ef235"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:49.099951+00:00, try_number=1, job_id=300, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-11 00:00:00+00:00 +INFO - Started process 2232 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-11T00:00:00+00:00', '--job-id', '300', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpabjlgl6x'] +INFO - Job 300: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180411T000000, start_date=20221111T003549, end_date=20221111T003552 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:52.285233Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a459e248-bd66-4d47-ae57-a585086ef235"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c0bdea38 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:58.999029Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8ad37314-3df7-4acd-8722-2bd62a84a6e4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:58.999029+00:00, try_number=1, job_id=304, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-11 00:00:00+00:00 +INFO - Started process 2257 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-11T00:00:00+00:00', '--job-id', '304', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuwr904kr'] +INFO - Job 304: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003559Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003559Z +20221111/us-east-1/s3/aws4_request +163bc06c8439ed17a73d651057b3b627d1cd1b4741a14d87653de511954519e0 +INFO - '2022-11-11' - botocore.auth - Signature: +84c9c8c19e4e1a07a5f7fb2451bea2157bf559b34dfe341a110a8099d042e2e4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '231a+lXbFvM53Hxn0MRnikN/nVxViq4DMY2p7L9J22XOtMLbJ1dJwI3kjAaDMdmJ03F4qJbDvB8=', 'x-amz-request-id': 'RQGF9KNA3NYAAE6X', 'Date': 'Fri, 11 Nov 2022 00:36:00 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180411T000000, start_date=20221111T003558, end_date=20221111T003601 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:01.023179Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8ad37314-3df7-4acd-8722-2bd62a84a6e4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c37019f9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:57.337537Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b47592ab-d0ee-457c-a7be-cec6794c2696"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:57.337537+00:00, try_number=1, job_id=303, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-11 00:00:00+00:00 +INFO - Started process 2272 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-11T00:00:00+00:00', '--job-id', '303', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcjl2mc_b'] +INFO - Job 303: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50031f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003558Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003558Z +20221111/us-east-1/s3/aws4_request +4e9eeb84075bd4ccde049dfba0f7e9dc20512799528ca4c385d2796946e5779e +INFO - '2022-11-11' - botocore.auth - Signature: +b89a47d3b083f49a9116b756fbe7b9acc9649c1def30f05e35ee1820344a6b11 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'kiC1kxm63Ngr0hH5qaYoSF7cEpdbG8OBjgwtOnglplppuac/f3lohFdhHh5K1kBnUTzdkmGySTY=', 'x-amz-request-id': 'QMH6ZX3ZKEZ7YJ8R', 'Date': 'Fri, 11 Nov 2022 00:35:58 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180411T000000, start_date=20221111T003557, end_date=20221111T003559 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:59.397733Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b47592ab-d0ee-457c-a7be-cec6794c2696"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c92ed4a9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:53.659941Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2f9b29d2-a993-4777-877d-815a9eec3f7f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:53.659941+00:00, try_number=1, job_id=302, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-11 00:00:00+00:00 +INFO - Started process 2267 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-11T00:00:00+00:00', '--job-id', '302', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptxezwku4'] +INFO - Job 302: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180411T000000, start_date=20221111T003553, end_date=20221111T003557 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:57.703819Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2f9b29d2-a993-4777-877d-815a9eec3f7f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..2d28bfdf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:35:53.646554Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d73d109a-2e36-3932-88d2-8c42b921cc16"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3062ca54-7cb1-4883-8c7a-a37c2234c3b1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:35:53.646554+00:00, try_number=1, job_id=301, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-11 00:00:00+00:00 +INFO - Started process 2266 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-11T00:00:00+00:00', '--job-id', '301', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9xs71hcn'] +INFO - Job 301: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180411T000000, start_date=20221111T003553, end_date=20221111T003555 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:35:55.931069Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3062ca54-7cb1-4883-8c7a-a37c2234c3b1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b52bd63c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:03.315006Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "da91a18c-2548-49ac-8b3a-52abaf43e99a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:03.315006+00:00, try_number=1, job_id=305, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-12 00:00:00+00:00 +INFO - Started process 2282 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-12T00:00:00+00:00', '--job-id', '305', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa5wn7rlh'] +INFO - Job 305: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180412T000000, start_date=20221111T003603, end_date=20221111T003606 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:06.394759Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "da91a18c-2548-49ac-8b3a-52abaf43e99a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..604ec98e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:03.330303Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "639ae67b-0248-43c2-80ba-ee404b9b628a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:03.330303+00:00, try_number=1, job_id=306, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-12 00:00:00+00:00 +INFO - Started process 2284 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-12T00:00:00+00:00', '--job-id', '306', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg4scwzuf'] +INFO - Job 306: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180412T000000, start_date=20221111T003603, end_date=20221111T003606 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:06.402363Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "639ae67b-0248-43c2-80ba-ee404b9b628a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..6030a560 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:13.658840Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e41d016-f34a-4f9f-a677-334df637e190"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:13.658840+00:00, try_number=1, job_id=310, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-12 00:00:00+00:00 +INFO - Started process 2326 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-12T00:00:00+00:00', '--job-id', '310', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwmcfdjs5'] +INFO - Job 310: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'y7W0XePeuxefSOeELQhCiA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:y7W0XePeuxefSOeELQhCiA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003614Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003614Z +20221111/us-east-1/s3/aws4_request +dc3dc89f8088bdf1d729d1a6588cbe1ce207d59e61f41a9526b55d0fb119393f +INFO - '2022-11-11' - botocore.auth - Signature: +73ca992a2744c95673d8fbc6ddb4aa780f60856c9423f0fb9a683a1e0e6509e6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8ayUVLt5gjfHHH1EjhcIRvYvjfMmzSPAQT/CicbieI3DdH/Aq88Fh6psHm+BN2x4kepaHibnjG4=', 'x-amz-request-id': 'WGQPFYGXNV8T3VW8', 'Date': 'Fri, 11 Nov 2022 00:36:14 GMT', 'ETag': '"cbb5b45de3debb179f48e7842d084288"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180412T000000, start_date=20221111T003613, end_date=20221111T003615 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:15.497085Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e41d016-f34a-4f9f-a677-334df637e190"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a17860a3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:12.322315Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4f8e9947-17f6-4a00-91c7-a9a792e30129"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:12.322315+00:00, try_number=1, job_id=309, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-12 00:00:00+00:00 +INFO - Started process 2320 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-12T00:00:00+00:00', '--job-id', '309', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp76beufg8'] +INFO - Job 309: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003612Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003612Z +20221111/us-east-1/s3/aws4_request +6f664647208e37a77abb005489dbd218b293cfbe4e2e27138cafeb340b42d5c2 +INFO - '2022-11-11' - botocore.auth - Signature: +758dfd21efb3627876e0271c4d4176fb7e1e472261324039d56e96109cc07efa +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jCjC3wVlfUes/pBhPzReMiy8qKlfzyyh6k+o3FyENLM1RBgh7ahivOWpyAELOPHFoNO09DAUoco=', 'x-amz-request-id': '9Z4G4M1002VQ6E6G', 'Date': 'Fri, 11 Nov 2022 00:36:13 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180412T000000, start_date=20221111T003612, end_date=20221111T003614 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:14.159127Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4f8e9947-17f6-4a00-91c7-a9a792e30129"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..2d37e502 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:07.657848Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a24c399-5ec5-41cc-a9e7-c6b54d35afce"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:07.657848+00:00, try_number=1, job_id=307, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-12 00:00:00+00:00 +INFO - Started process 2292 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-12T00:00:00+00:00', '--job-id', '307', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwut3n6w3'] +INFO - Job 307: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180412T000000, start_date=20221111T003607, end_date=20221111T003611 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:11.655784Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a24c399-5ec5-41cc-a9e7-c6b54d35afce"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..52c968d7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:07.714259Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce2477a9-5a41-33e6-ba51-cecd1bbe99d0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bf91144-8f83-4ccd-ac97-ea9da4316eee"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:07.714259+00:00, try_number=1, job_id=308, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-12 00:00:00+00:00 +INFO - Started process 2300 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-12T00:00:00+00:00', '--job-id', '308', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpiscfr7c6'] +INFO - Job 308: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180412T000000, start_date=20221111T003607, end_date=20221111T003610 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:10.422747Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bf91144-8f83-4ccd-ac97-ea9da4316eee"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c11d1d6d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:17.483526Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "caaca69a-a4bd-4b6b-ac4c-4b949f900c51"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:17.483526+00:00, try_number=1, job_id=311, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-13 00:00:00+00:00 +INFO - Started process 2318 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-13T00:00:00+00:00', '--job-id', '311', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphnkzqhxv'] +INFO - Job 311: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180413T000000, start_date=20221111T003617, end_date=20221111T003620 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:20.514584Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "caaca69a-a4bd-4b6b-ac4c-4b949f900c51"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2a273daa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:17.501402Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c63ef6e1-2fdf-4e45-ba80-24add56fdbba"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:17.501402+00:00, try_number=1, job_id=312, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-13 00:00:00+00:00 +INFO - Started process 2319 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-13T00:00:00+00:00', '--job-id', '312', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw29u7tw5'] +INFO - Job 312: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180413T000000, start_date=20221111T003617, end_date=20221111T003620 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:20.504088Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c63ef6e1-2fdf-4e45-ba80-24add56fdbba"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5de5893a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:28.942395Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "627b1e48-c8a4-4011-be38-2c0db938ba01"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:28.942395+00:00, try_number=1, job_id=316, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-13 00:00:00+00:00 +INFO - Started process 2384 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-13T00:00:00+00:00', '--job-id', '316', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqxpwog8s'] +INFO - Job 316: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'klmwpUetbmEH02dr/0x27w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:klmwpUetbmEH02dr/0x27w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003629Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003629Z +20221111/us-east-1/s3/aws4_request +d27acbf0a457056fa522b4b4e7550de1ea8f2c76467f5297411a66d78b0dcc42 +INFO - '2022-11-11' - botocore.auth - Signature: +165e52e4af909c01a4e809e484fbd6505e870d7baee4f9c962dbe5ad8f44f12d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'klkU3ElWOoQ3L3hLN9PoD464jbGnoSoMpoXh+874rgPvPVjTcWQxAxzXY3nvAT4uCSdJMNvhpTE=', 'x-amz-request-id': '19WF97R858X6EVZC', 'Date': 'Fri, 11 Nov 2022 00:36:30 GMT', 'ETag': '"9259b0a547ad6e6107d3676bff4c76ef"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180413T000000, start_date=20221111T003628, end_date=20221111T003630 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:30.859828Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "627b1e48-c8a4-4011-be38-2c0db938ba01"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..eb7e6c19 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:26.747828Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46e056e0-457a-4d83-a696-9540cfa04b11"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:26.747828+00:00, try_number=1, job_id=315, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-13 00:00:00+00:00 +INFO - Started process 2330 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-13T00:00:00+00:00', '--job-id', '315', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqkge88qp'] +INFO - Job 315: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003627Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003627Z +20221111/us-east-1/s3/aws4_request +f1676d8b11e6d8fb70b0c43e2fc19910ad7a85ec85171b468e52e25a5e0d9e13 +INFO - '2022-11-11' - botocore.auth - Signature: +45de05617e9486da6aaf807193bb6d5b504a5a3a9bcead84e6ae885191e43f6f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mD8wpPEsCntsnUvGDeNfRIwS2PEYRL6U/aMffRS8+alDl3XOcPRAT7mpRhSylPk0wZll1ivnNbQ=', 'x-amz-request-id': '2S08N0ANG8KR7165', 'Date': 'Fri, 11 Nov 2022 00:36:28 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180413T000000, start_date=20221111T003626, end_date=20221111T003628 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:28.706498Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46e056e0-457a-4d83-a696-9540cfa04b11"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..4ff47b15 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:21.963843Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e92071e-70bd-4271-aa1e-82142df8391f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:21.963843+00:00, try_number=1, job_id=314, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-13 00:00:00+00:00 +INFO - Started process 2369 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-13T00:00:00+00:00', '--job-id', '314', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_17g7dnc'] +INFO - Job 314: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180413T000000, start_date=20221111T003621, end_date=20221111T003627 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:27.169601Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e92071e-70bd-4271-aa1e-82142df8391f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..fd54a094 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:21.876746Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5fca4a59-ea2a-3deb-b7c4-43daf0012281"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65ea301a-8b5d-4109-a188-d9b7e2659e42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:21.876746+00:00, try_number=1, job_id=313, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-13 00:00:00+00:00 +INFO - Started process 2325 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-13T00:00:00+00:00', '--job-id', '313', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdtl8decq'] +INFO - Job 313: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180413T000000, start_date=20221111T003621, end_date=20221111T003624 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:24.571333Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65ea301a-8b5d-4109-a188-d9b7e2659e42"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7d58b962 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:33.295613Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b2c3c7c-c12d-49b7-a047-a20066cf8995"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:33.295613+00:00, try_number=1, job_id=318, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-14 00:00:00+00:00 +INFO - Started process 2395 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-14T00:00:00+00:00', '--job-id', '318', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptmxnzrjv'] +INFO - Job 318: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180414T000000, start_date=20221111T003633, end_date=20221111T003636 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:36.602006Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b2c3c7c-c12d-49b7-a047-a20066cf8995"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7764bdeb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:33.212647Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3ca2069c-c659-4da8-aad7-aea6a51b00f4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:33.212647+00:00, try_number=1, job_id=317, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-14 00:00:00+00:00 +INFO - Started process 2393 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-14T00:00:00+00:00', '--job-id', '317', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppbspx9c4'] +INFO - Job 317: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180414T000000, start_date=20221111T003633, end_date=20221111T003636 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:36.601573Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3ca2069c-c659-4da8-aad7-aea6a51b00f4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4f5b3b5c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:50.040639Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63875aed-8025-462f-82ec-da52e3227c9f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:50.040639+00:00, try_number=1, job_id=322, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-14 00:00:00+00:00 +INFO - Started process 2409 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-14T00:00:00+00:00', '--job-id', '322', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqgh0i95w'] +INFO - Job 322: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003651Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003651Z +20221111/us-east-1/s3/aws4_request +3f0b8f887a9dc8716ead9317149bc91c74272714d1c402f2fe6af9d8ffe3a014 +INFO - '2022-11-11' - botocore.auth - Signature: +ab678ae71fd4bbdfc39b8eb78d6dac838126719f6cb7f64d3cec390f3401f013 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'ikTET6oR0wMHa0OmbNR+0cnbYDCdL79qU9FfnxWyB4MtbLoYtfDjS4G7bKX0gj23gHJVBnE+z/A=', 'x-amz-request-id': '0AXH7MS3Z62E3W2P', 'Date': 'Fri, 11 Nov 2022 00:36:51 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180414T000000, start_date=20221111T003650, end_date=20221111T003652 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:52.514724Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63875aed-8025-462f-82ec-da52e3227c9f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..6df4b1a6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:46.048580Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd93ffdc-f744-4420-873d-042d5b1b3389"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:46.048580+00:00, try_number=1, job_id=321, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-14 00:00:00+00:00 +INFO - Started process 2402 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-14T00:00:00+00:00', '--job-id', '321', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdp__c15p'] +INFO - Job 321: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003647Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003647Z +20221111/us-east-1/s3/aws4_request +030cd4c0d1aed4f29ccecb04567f3ad1fb8ae0eed377e75c61d3a0a47324e123 +INFO - '2022-11-11' - botocore.auth - Signature: +8cccef180f93b05b71c484a027e86db4e1b2ebda6fc75698027d113b57478c29 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Y7ppQSd0Ny6i5BNeVc2BwtRwOvXbD3yZOL6NXIojHXMhPzvqEcfz1qR5+g7DvpOmVOc49Vhr+Eg=', 'x-amz-request-id': 'JEC5QEBN1CM21FYC', 'Date': 'Fri, 11 Nov 2022 00:36:47 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180414T000000, start_date=20221111T003646, end_date=20221111T003648 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:48.644748Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd93ffdc-f744-4420-873d-042d5b1b3389"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..7df2a383 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:38.576579Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f004c47-b021-43b5-97e6-c18f2ad7a1cb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:38.576579+00:00, try_number=1, job_id=319, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-14 00:00:00+00:00 +INFO - Started process 2412 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-14T00:00:00+00:00', '--job-id', '319', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzs3jhsps'] +INFO - Job 319: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180414T000000, start_date=20221111T003638, end_date=20221111T003648 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:48.342526Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f004c47-b021-43b5-97e6-c18f2ad7a1cb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a128b75c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:36:38.787008Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5899da6f-b4ab-36ad-8bba-a1aeb9389adf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e37f40e-b83d-4c7c-bfcd-0974e7ffda1c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:38.787008+00:00, try_number=1, job_id=320, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-14 00:00:00+00:00 +INFO - Started process 2415 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-14T00:00:00+00:00', '--job-id', '320', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmped5ugkwq'] +INFO - Job 320: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180414T000000, start_date=20221111T003638, end_date=20221111T003642 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:42.898353Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e37f40e-b83d-4c7c-bfcd-0974e7ffda1c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..17a879fe --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:55.827031Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce99126f-8a10-4a84-a538-b093df0e3826"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:55.827031+00:00, try_number=1, job_id=323, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-15 00:00:00+00:00 +INFO - Started process 2478 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-15T00:00:00+00:00', '--job-id', '323', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyour7_yh'] +INFO - Job 323: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180415T000000, start_date=20221111T003655, end_date=20221111T003659 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:59.683297Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce99126f-8a10-4a84-a538-b093df0e3826"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..e52e8442 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:36:55.860166Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2908076a-9ee1-4491-928a-6e87851a7078"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:36:55.860166+00:00, try_number=1, job_id=324, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-15 00:00:00+00:00 +INFO - Started process 2480 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-15T00:00:00+00:00', '--job-id', '324', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0ymjf0q4'] +INFO - Job 324: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180415T000000, start_date=20221111T003655, end_date=20221111T003659 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:36:59.692498Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2908076a-9ee1-4491-928a-6e87851a7078"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..314090b3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:11.951598Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bce441f4-43f2-472a-9b4c-539d8674cfad"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:11.951598+00:00, try_number=1, job_id=328, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-15 00:00:00+00:00 +INFO - Started process 2511 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-15T00:00:00+00:00', '--job-id', '328', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa3bctj2j'] +INFO - Job 328: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '6IN8cWTSqpn8CXjnFPTA2A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:6IN8cWTSqpn8CXjnFPTA2A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003713Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003713Z +20221111/us-east-1/s3/aws4_request +e1558554f461f6dee5daedace743ee0bd525222b524032862a4552d068cef404 +INFO - '2022-11-11' - botocore.auth - Signature: +d48f2e2b1db5d2ec356d342e47dfdb386de6f596ec0df6bdef559a61d90cc0f3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'N7XSMeoxwSY/qMG3Ty8YVnLBN7lqLTqQGzhSkTAJoHbATBELajPbRR0MRMYRPVsk/YFIVlOgNqo=', 'x-amz-request-id': 'MVWGFC65D1X8CWHD', 'Date': 'Fri, 11 Nov 2022 00:37:13 GMT', 'ETag': '"e8837c7164d2aa99fc0978e714f4c0d8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180415T000000, start_date=20221111T003711, end_date=20221111T003715 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:15.196578Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bce441f4-43f2-472a-9b4c-539d8674cfad"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..ac58725a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:07.165339Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1110152f-f526-4d1c-be96-3dcafe0ae44b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:07.165339+00:00, try_number=1, job_id=327, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-15 00:00:00+00:00 +INFO - Started process 2479 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-15T00:00:00+00:00', '--job-id', '327', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1rnpnnik'] +INFO - Job 327: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003708Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003708Z +20221111/us-east-1/s3/aws4_request +ab567ff883916e8e926cfe3f682bf64b416a61188ac303989a03a2b8356fa6e1 +INFO - '2022-11-11' - botocore.auth - Signature: +9955f6534c3604c7bfb0d01f211348868a871ad244f267623d2de49ff8d6d60a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'uTe0du3sS/h8ocZPdLOgVariF3u5dKzQj3cfURERxGPJpc+iOwBzKRRT2Pq1K31RHjXI4a0GY4Y=', 'x-amz-request-id': 'MJJ2X29H1WZ6DG9N', 'Date': 'Fri, 11 Nov 2022 00:37:09 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180415T000000, start_date=20221111T003707, end_date=20221111T003709 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:09.984765Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1110152f-f526-4d1c-be96-3dcafe0ae44b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..85cb42b4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:01.639789Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e901991-e298-45ed-96c6-89483bd262fa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:01.639789+00:00, try_number=1, job_id=325, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-15 00:00:00+00:00 +INFO - Started process 2487 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-15T00:00:00+00:00', '--job-id', '325', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbegmj20j'] +INFO - Job 325: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180415T000000, start_date=20221111T003701, end_date=20221111T003709 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:09.744640Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e901991-e298-45ed-96c6-89483bd262fa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..0d2efa79 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:01.907810Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6ce3b40c-a769-32ca-a0f4-0a699aceffcc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dcdd343d-4c01-40d1-9b02-035ab7898279"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:01.907810+00:00, try_number=1, job_id=326, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-15 00:00:00+00:00 +INFO - Started process 2490 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-15T00:00:00+00:00', '--job-id', '326', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpc0jhwaxr'] +INFO - Job 326: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180415T000000, start_date=20221111T003701, end_date=20221111T003705 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:05.416659Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dcdd343d-4c01-40d1-9b02-035ab7898279"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..911a2423 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:37:16.948870Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c66c8fdb-502d-4dd6-9814-1080adf3db0e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:16.948870+00:00, try_number=1, job_id=329, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-16 00:00:00+00:00 +INFO - Started process 2540 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-16T00:00:00+00:00', '--job-id', '329', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8s7889ra'] +INFO - Job 329: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180416T000000, start_date=20221111T003716, end_date=20221111T003719 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:19.878253Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c66c8fdb-502d-4dd6-9814-1080adf3db0e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a243f00d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:37:16.994825Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "55b30e3c-a97c-4e75-916d-50b288087a77"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:16.994825+00:00, try_number=1, job_id=330, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-16 00:00:00+00:00 +INFO - Started process 2542 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-16T00:00:00+00:00', '--job-id', '330', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphiorfeo7'] +INFO - Job 330: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180416T000000, start_date=20221111T003716, end_date=20221111T003721 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:21.324861Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "55b30e3c-a97c-4e75-916d-50b288087a77"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..41a4fc8f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:29.456354Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2002d505-3b63-40de-b290-1155ec50f34b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:29.456354+00:00, try_number=1, job_id=334, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-16 00:00:00+00:00 +INFO - Started process 2488 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-16T00:00:00+00:00', '--job-id', '334', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph8tr6bxi'] +INFO - Job 334: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003730Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003730Z +20221111/us-east-1/s3/aws4_request +709890de7fc8a38427382db77b67c6b710faa5efea7a27bcb8a6a5f3e02345c2 +INFO - '2022-11-11' - botocore.auth - Signature: +bbd488a6f7e3ac19adde54440f349973cf460f06f76b8fa4022aad06ef873220 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'xLJXEWlzZLQXIqUjQrXnZsvouB8lpP1oJYVHsBBdOYozOh13DQ9+/fXoOclI11i7BcT35f/v1V8=', 'x-amz-request-id': 'PQHXYDC32DP5X2DV', 'Date': 'Fri, 11 Nov 2022 00:37:30 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180416T000000, start_date=20221111T003729, end_date=20221111T003731 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:31.403446Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2002d505-3b63-40de-b290-1155ec50f34b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..eba96c6a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:27.741578Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bdd9e70a-8c90-46a9-83ab-d0097d85dbe3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:27.741578+00:00, try_number=1, job_id=333, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-16 00:00:00+00:00 +INFO - Started process 2588 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-16T00:00:00+00:00', '--job-id', '333', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2jp0nrdr'] +INFO - Job 333: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003728Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003728Z +20221111/us-east-1/s3/aws4_request +a834c2f773339d5eb5358a165844ae0505c6011140050fa84e1a8fb88334eb50 +INFO - '2022-11-11' - botocore.auth - Signature: +f7c2d0fe4fe4f5a3653ebbb941c76f7bb76c6c22065fa131d60f26f72fd86b82 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'dSwO3M2j5fJWtpoY1oeLP5XvWpn4XCsjmhx2yu1UgeWpbS2ds8i/eJGpkuuw2xgGLFZO1hGnNz0=', 'x-amz-request-id': 'DG8W4SZNSQK69VVS', 'Date': 'Fri, 11 Nov 2022 00:37:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180416T000000, start_date=20221111T003727, end_date=20221111T003729 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:29.662392Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bdd9e70a-8c90-46a9-83ab-d0097d85dbe3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..28f498be --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:21.504332Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a6e0a8f-f658-4108-bcf2-ce16735cdc0a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:21.504332+00:00, try_number=1, job_id=331, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-16 00:00:00+00:00 +INFO - Started process 2554 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-16T00:00:00+00:00', '--job-id', '331', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr7m0spmq'] +INFO - Job 331: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180416T000000, start_date=20221111T003721, end_date=20221111T003727 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:27.456490Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a6e0a8f-f658-4108-bcf2-ce16735cdc0a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..61e46833 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:22.969810Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "805c02ab-fad9-3b7d-aa4d-b756e212e5a2"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eb330a0e-86f6-48d3-bdc5-5adf8e860cad"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:22.969810+00:00, try_number=1, job_id=332, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-16 00:00:00+00:00 +INFO - Started process 2572 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-16T00:00:00+00:00', '--job-id', '332', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4ook1arh'] +INFO - Job 332: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180416T000000, start_date=20221111T003722, end_date=20221111T003726 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:26.586014Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eb330a0e-86f6-48d3-bdc5-5adf8e860cad"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c6c144eb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:37:33.357875Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9ceb1812-d2a6-4d81-8f29-4ae80cd5bfba"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:33.357875+00:00, try_number=1, job_id=336, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-17 00:00:00+00:00 +INFO - Started process 2599 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-17T00:00:00+00:00', '--job-id', '336', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp86ifz2cr'] +INFO - Job 336: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180417T000000, start_date=20221111T003733, end_date=20221111T003736 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:36.144531Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9ceb1812-d2a6-4d81-8f29-4ae80cd5bfba"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..37c34200 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:37:33.351104Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "032a9fad-cb4d-4b44-be89-d7d32a2e5c81"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:33.351104+00:00, try_number=1, job_id=335, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-17 00:00:00+00:00 +INFO - Started process 2597 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-17T00:00:00+00:00', '--job-id', '335', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1s380lbe'] +INFO - Job 335: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180417T000000, start_date=20221111T003733, end_date=20221111T003736 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:36.123786Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "032a9fad-cb4d-4b44-be89-d7d32a2e5c81"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4dee4e0b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:45.673185Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4471bf23-a04d-47e8-9f2a-6466e7468f2f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:45.673185+00:00, try_number=1, job_id=340, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-17 00:00:00+00:00 +INFO - Started process 2567 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-17T00:00:00+00:00', '--job-id', '340', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0x7x84us'] +INFO - Job 340: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003746Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003746Z +20221111/us-east-1/s3/aws4_request +67ae9df4aa427821d6c06c101f49ecab99d837a883afa82d35a00c6431a39f2c +INFO - '2022-11-11' - botocore.auth - Signature: +b656c53e3188806b17bc805baa13845fed4099f1fae0a363f4b57753d9925d3a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'F9DEBXIgLEigPI2Ma+wkoFLKxQGgHowWR/sg/pQXPiZHjO6bpwJqmYVVXjXozb5KIeOmKmGMV8Y=', 'x-amz-request-id': 'NBNYMMRQ1D2CQVNB', 'Date': 'Fri, 11 Nov 2022 00:37:47 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180417T000000, start_date=20221111T003745, end_date=20221111T003748 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:48.177946Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4471bf23-a04d-47e8-9f2a-6466e7468f2f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..69477572 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:41.949016Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d7ff8cc1-6096-4a3e-91d0-b8d1d9a9555d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:41.949016+00:00, try_number=1, job_id=339, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-17 00:00:00+00:00 +INFO - Started process 2560 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-17T00:00:00+00:00', '--job-id', '339', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps5t6voa5'] +INFO - Job 339: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003742Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003742Z +20221111/us-east-1/s3/aws4_request +b976124c04ae80c406165494a2d575fe5bea362d43ecb05b523abbb89024fb40 +INFO - '2022-11-11' - botocore.auth - Signature: +2d0ae445f4af35ed7740d4010f1430b086e2746ce2b56a921834ac5b3fa60320 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'i+lto2O80BGbXx+zb4riGz4DXWfPX2W94A0LU9hXg/fw6NfPC/pCdCOoTIciiWXlluc8OA8BVOU=', 'x-amz-request-id': 'K8G6NXXPWN5CHF10', 'Date': 'Fri, 11 Nov 2022 00:37:43 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180417T000000, start_date=20221111T003741, end_date=20221111T003744 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:44.216060Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d7ff8cc1-6096-4a3e-91d0-b8d1d9a9555d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..0be14a5b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:37.527088Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e0e0c3c-1ed4-4c9a-a47b-21ebd56d95d3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:37.527088+00:00, try_number=1, job_id=338, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-17 00:00:00+00:00 +INFO - Started process 2609 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-17T00:00:00+00:00', '--job-id', '338', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi8maghg8'] +INFO - Job 338: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180417T000000, start_date=20221111T003737, end_date=20221111T003742 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:42.370215Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e0e0c3c-1ed4-4c9a-a47b-21ebd56d95d3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..5e0081f0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:37.497648Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "718e01dd-1884-32fe-82f8-866e07f2342d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "83da2c04-1a42-4761-8649-32a453cbdcf7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:37.497648+00:00, try_number=1, job_id=337, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-17 00:00:00+00:00 +INFO - Started process 2607 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-17T00:00:00+00:00', '--job-id', '337', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9bl1vurt'] +INFO - Job 337: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180417T000000, start_date=20221111T003737, end_date=20221111T003740 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:40.007905Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "83da2c04-1a42-4761-8649-32a453cbdcf7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..4a8d8c00 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:37:50.471120Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "940e1a4f-15e4-497b-8707-7f553dd6d569"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:50.471120+00:00, try_number=1, job_id=342, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-18 00:00:00+00:00 +INFO - Started process 2578 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-18T00:00:00+00:00', '--job-id', '342', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm0vry2w7'] +INFO - Job 342: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180418T000000, start_date=20221111T003750, end_date=20221111T003754 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:54.459136Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "940e1a4f-15e4-497b-8707-7f553dd6d569"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d9ac66d2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:37:50.468895Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fc51c953-b7a9-4d71-9513-4785724a41c9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:50.468895+00:00, try_number=1, job_id=341, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-18 00:00:00+00:00 +INFO - Started process 2576 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-18T00:00:00+00:00', '--job-id', '341', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpc0p9vu6r'] +INFO - Job 341: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180418T000000, start_date=20221111T003750, end_date=20221111T003753 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:53.725560Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fc51c953-b7a9-4d71-9513-4785724a41c9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..a911df5b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:03.073303Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e471a599-b216-496c-a271-a925b81e74e5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:03.073303+00:00, try_number=1, job_id=346, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-18 00:00:00+00:00 +INFO - Started process 2609 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-18T00:00:00+00:00', '--job-id', '346', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx1v3dbm8'] +INFO - Job 346: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'WL5L7Z60E6izwc8htiXOLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:WL5L7Z60E6izwc8htiXOLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003803Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003803Z +20221111/us-east-1/s3/aws4_request +107159d3eab9bbfb4789cfb015df42c7a762362707644b0c843e04bc0ec9764f +INFO - '2022-11-11' - botocore.auth - Signature: +23f39e0639869df49e6a70c7e4e986b46b4603475a031326b6d752dd67bc188a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'SGmNX/S4LlaP7c9eiKJhwLn30A8m/I9zM14N8daYalrFJk/VbFvjOKpCef/ps4Qxyn1IDXPzRTg=', 'x-amz-request-id': 'M941W12NNFFPCP0Q', 'Date': 'Fri, 11 Nov 2022 00:38:04 GMT', 'ETag': '"58be4bed9eb413a8b3c1cf21b625ce2c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180418T000000, start_date=20221111T003803, end_date=20221111T003805 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:05.111837Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e471a599-b216-496c-a271-a925b81e74e5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1b3aed4a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:00.965648Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e0da1fb-6624-4e57-9c53-c95598b051ac"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:00.965648+00:00, try_number=1, job_id=345, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-18 00:00:00+00:00 +INFO - Started process 2690 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-18T00:00:00+00:00', '--job-id', '345', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgdhqxc3n'] +INFO - Job 345: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003802Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003802Z +20221111/us-east-1/s3/aws4_request +3cd9fb20f0b7b707e2dc76d9ff5b4211d598937e21faf1766384ad54bac41bd4 +INFO - '2022-11-11' - botocore.auth - Signature: +f1a9a2e2d315bf860ba43902ebebf0f56dc18db69373818f1f88b090fe05aff2 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8Hx8Ksah1IzebDTtc6UfPAxcJ4SkrKQ3jz9dqorA/BkzXKDW29Iz4pEvCbtm9yONlcV4pF1PsSk=', 'x-amz-request-id': '1GPM7F8VA9M4BG1F', 'Date': 'Fri, 11 Nov 2022 00:38:03 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180418T000000, start_date=20221111T003800, end_date=20221111T003804 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:04.044681Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e0da1fb-6624-4e57-9c53-c95598b051ac"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a44a095e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:55.883343Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "28262a38-2099-4a96-8fec-3b760367fc61"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:55.883343+00:00, try_number=1, job_id=344, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-18 00:00:00+00:00 +INFO - Started process 2684 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-18T00:00:00+00:00', '--job-id', '344', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn4k3ed8a'] +INFO - Job 344: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180418T000000, start_date=20221111T003755, end_date=20221111T003800 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:00.388773Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "28262a38-2099-4a96-8fec-3b760367fc61"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..bf5e1483 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:37:55.887560Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "14563cd0-07cb-363b-b961-9181f8819aed"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b7ac2bc-bca8-4ebf-a5ae-39c4d9ed7ab2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:37:55.887560+00:00, try_number=1, job_id=343, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-18 00:00:00+00:00 +INFO - Started process 2683 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-18T00:00:00+00:00', '--job-id', '343', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgd7otc29'] +INFO - Job 343: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180418T000000, start_date=20221111T003755, end_date=20221111T003758 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:37:58.836029Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b7ac2bc-bca8-4ebf-a5ae-39c4d9ed7ab2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..82266aab --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:07.465847Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6364bd6-981c-4dd0-aa84-aca4831eef87"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:07.465847+00:00, try_number=1, job_id=348, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-19 00:00:00+00:00 +INFO - Started process 2655 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-19T00:00:00+00:00', '--job-id', '348', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpomx52i09'] +INFO - Job 348: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180419T000000, start_date=20221111T003807, end_date=20221111T003810 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:10.110487Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6364bd6-981c-4dd0-aa84-aca4831eef87"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..5010a7b1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:07.457494Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d655ce0d-188d-4036-960a-f3434f3c4159"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:07.457494+00:00, try_number=1, job_id=347, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-19 00:00:00+00:00 +INFO - Started process 2652 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-19T00:00:00+00:00', '--job-id', '347', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzu5nsn_5'] +INFO - Job 347: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180419T000000, start_date=20221111T003807, end_date=20221111T003810 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:10.107272Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d655ce0d-188d-4036-960a-f3434f3c4159"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4fdcad64 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:16.407302Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e11c68e2-08d2-461c-98c9-15e19bff466a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:16.407302+00:00, try_number=1, job_id=351, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-19 00:00:00+00:00 +INFO - Started process 2677 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-19T00:00:00+00:00', '--job-id', '351', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj56h65g6'] +INFO - Job 351: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'uIiM0RJ6IyBInTwburV+og==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:uIiM0RJ6IyBInTwburV+og== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003817Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003817Z +20221111/us-east-1/s3/aws4_request +7777864713c61dd0efd96a65b0c6c94a0a7cd918d8ca13f8d47609abe15e1886 +INFO - '2022-11-11' - botocore.auth - Signature: +95d6e9d5f1d8f358434462ec4fcb52a223c0514be2048c1e87b5c73310a3479a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'O7sF8rVogJ31KT/kzziliVao3w/DjZGrjw5KfRopIdke+rit/EnXwYVOB9bwL3YT6AttEx/jQq8=', 'x-amz-request-id': '6B3JDD2C7MDGVDKC', 'Date': 'Fri, 11 Nov 2022 00:38:18 GMT', 'ETag': '"b8888cd1127a2320489d3c1bbab57ea2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180419T000000, start_date=20221111T003816, end_date=20221111T003818 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:18.951598Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e11c68e2-08d2-461c-98c9-15e19bff466a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1648a058 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:17.755396Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a8f19b85-23a1-4051-a84e-410e840ebc4e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:17.755396+00:00, try_number=1, job_id=352, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-19 00:00:00+00:00 +INFO - Started process 2682 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-19T00:00:00+00:00', '--job-id', '352', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2qstyx3c'] +INFO - Job 352: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003818Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003818Z +20221111/us-east-1/s3/aws4_request +8ffe61b9fd77a9656d8401908fd509edd748f525074811126a6c1ba1cce052c7 +INFO - '2022-11-11' - botocore.auth - Signature: +397e5568647163a85679123ce9759d87370ee77b2cafc7ea628b1147449fdacb +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '4saMx59TbPmAcsQdm7f5sezp3AIE+J7ylMhybtRPazpwMnYBRT+4/YG149ZH7ps9P1Ew6d1QVtY=', 'x-amz-request-id': 'GZGMY02D4KA19FCV', 'Date': 'Fri, 11 Nov 2022 00:38:19 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180419T000000, start_date=20221111T003817, end_date=20221111T003819 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:19.869679Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a8f19b85-23a1-4051-a84e-410e840ebc4e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e54b4b68 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:11.426762Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c5dda684-0236-4891-919e-736567b84008"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:11.426762+00:00, try_number=1, job_id=349, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-19 00:00:00+00:00 +INFO - Started process 2668 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-19T00:00:00+00:00', '--job-id', '349', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp4f4v6fm'] +INFO - Job 349: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180419T000000, start_date=20221111T003811, end_date=20221111T003814 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:14.940653Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c5dda684-0236-4891-919e-736567b84008"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..9cb5fa21 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:11.442474Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a5d401d7-c2b5-390e-80d8-f1d76b142f30"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "33dc347c-525b-44a7-84ac-34c2aee9c84c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:11.442474+00:00, try_number=1, job_id=350, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-19 00:00:00+00:00 +INFO - Started process 2670 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-19T00:00:00+00:00', '--job-id', '350', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpupvg8pii'] +INFO - Job 350: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180419T000000, start_date=20221111T003811, end_date=20221111T003816 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:16.188692Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "33dc347c-525b-44a7-84ac-34c2aee9c84c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..4baa283a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:21.412281Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9b4acb8-8d9d-47df-a8f1-5bbbd0726cd1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:21.412281+00:00, try_number=1, job_id=354, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-20 00:00:00+00:00 +INFO - Started process 2741 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-20T00:00:00+00:00', '--job-id', '354', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph4zfa_3i'] +INFO - Job 354: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180420T000000, start_date=20221111T003821, end_date=20221111T003824 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:24.524902Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9b4acb8-8d9d-47df-a8f1-5bbbd0726cd1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6b9e9563 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:21.404686Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "47d47443-59ae-4e2b-a778-bbf45d0b89bb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:21.404686+00:00, try_number=1, job_id=353, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-20 00:00:00+00:00 +INFO - Started process 2740 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-20T00:00:00+00:00', '--job-id', '353', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzv10krd1'] +INFO - Job 353: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180420T000000, start_date=20221111T003821, end_date=20221111T003824 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:24.530913Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "47d47443-59ae-4e2b-a778-bbf45d0b89bb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..9f0fa7e0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:31.923946Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "809c090a-8243-4d66-8466-d490b63fc5b5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:31.923946+00:00, try_number=1, job_id=358, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-20 00:00:00+00:00 +INFO - Started process 2690 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-20T00:00:00+00:00', '--job-id', '358', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw_5lo3sl'] +INFO - Job 358: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'uIiM0RJ6IyBInTwburV+og==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:uIiM0RJ6IyBInTwburV+og== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003832Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003832Z +20221111/us-east-1/s3/aws4_request +e5245236ce41cab80e8d1f9f4a2a99d99b2b1d469d11a91e97fc5c1dadcac056 +INFO - '2022-11-11' - botocore.auth - Signature: +fbbac4c83ef5004164c58b476bc0997e7604bd33d0ad574a8645373f4bea6654 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'T7nZ/xpdkOEyUKBbxOSzO7Z6AYliN0LIgQAiVI9EBR3KFs7Ib4wkEt7Wo7R+wRshmiEoxowtVxQ=', 'x-amz-request-id': 'SY2WNRQHGP199GMM', 'Date': 'Fri, 11 Nov 2022 00:38:33 GMT', 'ETag': '"b8888cd1127a2320489d3c1bbab57ea2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180420T000000, start_date=20221111T003831, end_date=20221111T003833 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:33.869198Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "809c090a-8243-4d66-8466-d490b63fc5b5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1da907f1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:30.528778Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed86c0f0-7e5f-46e3-b1f3-8ede54da33ad"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:30.528778+00:00, try_number=1, job_id=357, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-20 00:00:00+00:00 +INFO - Started process 2782 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-20T00:00:00+00:00', '--job-id', '357', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz77xo6db'] +INFO - Job 357: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa3f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003831Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003831Z +20221111/us-east-1/s3/aws4_request +a6869091f245b0ec2d997e3c0af8de475eae80dbefa354d874f69e90a3c7c263 +INFO - '2022-11-11' - botocore.auth - Signature: +2d413df7d51b0a556ec7487c964ed12140178a4f1ccc2f0039d2e8f68c20f2ca +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '4OgvYL1nfwgNE8KWuquGQOvlmz/D83YRiT0l3s4bd4ahXrtBvNsY0i/HFSVkYfDjY6cn+w6MrEc=', 'x-amz-request-id': '3K6270VXD2H8QR4E', 'Date': 'Fri, 11 Nov 2022 00:38:31 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180420T000000, start_date=20221111T003830, end_date=20221111T003832 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:32.313625Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed86c0f0-7e5f-46e3-b1f3-8ede54da33ad"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..037dda58 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:26.075773Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e9e356e-9c9e-4dc7-831d-06ba1718c5cc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:26.075773+00:00, try_number=1, job_id=355, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-20 00:00:00+00:00 +INFO - Started process 2775 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-20T00:00:00+00:00', '--job-id', '355', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp3t94e7m'] +INFO - Job 355: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180420T000000, start_date=20221111T003826, end_date=20221111T003830 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:30.393290Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e9e356e-9c9e-4dc7-831d-06ba1718c5cc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3ddaae9d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:26.093721Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "db529545-7eaa-34be-aa7e-455e13443cbd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d937fe6f-7a29-4cca-9ac9-3cb238a8a964"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:26.093721+00:00, try_number=1, job_id=356, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-20 00:00:00+00:00 +INFO - Started process 2776 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-20T00:00:00+00:00', '--job-id', '356', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpot7qfvny'] +INFO - Job 356: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180420T000000, start_date=20221111T003826, end_date=20221111T003829 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:29.086198Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d937fe6f-7a29-4cca-9ac9-3cb238a8a964"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..1f6724eb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:36.183361Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85fcdf03-c679-46d7-b31c-a99a235ce0c3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:36.183361+00:00, try_number=1, job_id=359, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-21 00:00:00+00:00 +INFO - Started process 2793 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-21T00:00:00+00:00', '--job-id', '359', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw9jvjvr2'] +INFO - Job 359: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180421T000000, start_date=20221111T003836, end_date=20221111T003839 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:39.297327Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85fcdf03-c679-46d7-b31c-a99a235ce0c3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a958789e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:36.185266Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f5dd676-fc29-47d7-986a-ee8db5604dd4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:36.185266+00:00, try_number=1, job_id=360, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-21 00:00:00+00:00 +INFO - Started process 2791 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-21T00:00:00+00:00', '--job-id', '360', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnl1ouzrj'] +INFO - Job 360: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180421T000000, start_date=20221111T003836, end_date=20221111T003839 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:39.302148Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f5dd676-fc29-47d7-986a-ee8db5604dd4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d779d38a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:49.111723Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9abcdaee-a4ed-4433-aea4-d08d15775497"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:49.111723+00:00, try_number=1, job_id=364, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-21 00:00:00+00:00 +INFO - Started process 2849 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-21T00:00:00+00:00', '--job-id', '364', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjykfau37'] +INFO - Job 364: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'FYppOHVSXYFd3r0K9OySZw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:FYppOHVSXYFd3r0K9OySZw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003850Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003850Z +20221111/us-east-1/s3/aws4_request +c22ff0cdfe820b34b745710385b63927ca515f697470cc9616441d6967da0e83 +INFO - '2022-11-11' - botocore.auth - Signature: +f672aafab792941bd30b0321de3219f8bd70118f0f25a09c500f2320beeedaf7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6zd+nHXQHTTGTYeUfikcQgS8X9cxsWJg4fDF78+EAwHBsQNUx3v3vCLLGLyU2e64pIkgimQnfs4=', 'x-amz-request-id': 'KHFGR3D3JPXVMC0P', 'Date': 'Fri, 11 Nov 2022 00:38:50 GMT', 'ETag': '"158a693875525d815ddebd0af4ec9267"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180421T000000, start_date=20221111T003849, end_date=20221111T003851 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:51.527968Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9abcdaee-a4ed-4433-aea4-d08d15775497"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9261dd74 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:46.135956Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51d12f21-901d-4939-bdb8-7f854349a55f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:46.135956+00:00, try_number=1, job_id=363, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-21 00:00:00+00:00 +INFO - Started process 2826 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-21T00:00:00+00:00', '--job-id', '363', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2lix15wb'] +INFO - Job 363: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003847Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003847Z +20221111/us-east-1/s3/aws4_request +441b42952f4f377ab32dcaedf19f48c603c612ed810cdfc3e24faae57aa9a47e +INFO - '2022-11-11' - botocore.auth - Signature: +190bd2d25f79023f209c49acce3c89564df7b58daf0e862527fb2741ad4a8804 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Yuwa0arninuu4zovyZjV5nU6DQUuGNARo0KgOVBmriS0aLT2nVhHhBHsfg8RBv57EIuYyMC6/aM=', 'x-amz-request-id': 'VWCBFY4MSC0FCDQ2', 'Date': 'Fri, 11 Nov 2022 00:38:48 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180421T000000, start_date=20221111T003846, end_date=20221111T003848 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:48.900777Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51d12f21-901d-4939-bdb8-7f854349a55f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8741d0c7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:40.801987Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7b7ee41-bad2-4efa-8f44-bacfa210cc74"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:40.801987+00:00, try_number=1, job_id=361, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-21 00:00:00+00:00 +INFO - Started process 2802 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-21T00:00:00+00:00', '--job-id', '361', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf9ljbzl7'] +INFO - Job 361: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180421T000000, start_date=20221111T003840, end_date=20221111T003847 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:47.150535Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7b7ee41-bad2-4efa-8f44-bacfa210cc74"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..ff24b27f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:38:40.815186Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc77145-ab25-37b8-9322-548bc4caf35f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c842a96-eac0-4635-a866-9bad5f76178c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:40.815186+00:00, try_number=1, job_id=362, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-21 00:00:00+00:00 +INFO - Started process 2803 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-21T00:00:00+00:00', '--job-id', '362', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1tde04xe'] +INFO - Job 362: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180421T000000, start_date=20221111T003840, end_date=20221111T003843 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:38:43.627406Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c842a96-eac0-4635-a866-9bad5f76178c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d40117c4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:55.223890Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2756a9df-a114-4c91-8335-436dd1e28fd8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:55.223890+00:00, try_number=1, job_id=366, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-22 00:00:00+00:00 +INFO - Started process 2766 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-22T00:00:00+00:00', '--job-id', '366', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsf_4vjn0'] +INFO - Job 366: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180422T000000, start_date=20221111T003855, end_date=20221111T003900 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:00.534508Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2756a9df-a114-4c91-8335-436dd1e28fd8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..539f0398 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:38:55.223392Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3174044f-4521-42b9-93fc-9636658ef642"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:38:55.223392+00:00, try_number=1, job_id=365, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-22 00:00:00+00:00 +INFO - Started process 2765 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-22T00:00:00+00:00', '--job-id', '365', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpglj_5hr1'] +INFO - Job 365: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180422T000000, start_date=20221111T003855, end_date=20221111T003900 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:00.482981Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3174044f-4521-42b9-93fc-9636658ef642"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..56679246 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:14.720515Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a65f971f-a866-4685-94cf-6bc0c5f42c3a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:14.720515+00:00, try_number=1, job_id=370, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-22 00:00:00+00:00 +INFO - Started process 2847 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-22T00:00:00+00:00', '--job-id', '370', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpabpi1nf6'] +INFO - Job 370: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'ubHIMH5+nL74pCbTcc7KBw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:ubHIMH5+nL74pCbTcc7KBw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003915Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003915Z +20221111/us-east-1/s3/aws4_request +cf7c80c9d07d5933f2af58929ceb613aae2cccf350cf33848b6fc5629904aac8 +INFO - '2022-11-11' - botocore.auth - Signature: +8936117c1fee75d5f4b30f32bf31926d44d8b79ee21d02768c13a6eba2dfef3c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6zrESijmVtKFlJcXuv1ADpgMFM4tjjbF4GWMyY0lQJYMaMbRPwZEi8vBLyMnMu+N2DFfAJPw3Z4=', 'x-amz-request-id': 'FJMCMAZ6EF7VRZ4Z', 'Date': 'Fri, 11 Nov 2022 00:39:16 GMT', 'ETag': '"b9b1c8307e7e9cbef8a426d371ceca07"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180422T000000, start_date=20221111T003914, end_date=20221111T003916 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:16.823670Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a65f971f-a866-4685-94cf-6bc0c5f42c3a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..75c1aeba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:09.090724Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a39a344c-aef9-48ee-87b5-afa78f9aec0f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:09.090724+00:00, try_number=1, job_id=369, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-22 00:00:00+00:00 +INFO - Started process 2888 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-22T00:00:00+00:00', '--job-id', '369', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptjnj_fyg'] +INFO - Job 369: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f5005550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003910Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003910Z +20221111/us-east-1/s3/aws4_request +036a9c7feefc1a95c143ca7f9447a725895b84eb97f759cec8183ad4416ffc6d +INFO - '2022-11-11' - botocore.auth - Signature: +6ef5ba7b52b9390b181f9afeb89e2969d3e323d29c3acb81e87e66f68c1d315d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'OHLlUBmkS5jGPqqH2S1MBpdxL2ksqW66HEBG0bno+hw/YhtcwxaPSY72pxZHnQyOjQJiKTxbR1s=', 'x-amz-request-id': 'FVTVSDGYPQ7AK2RV', 'Date': 'Fri, 11 Nov 2022 00:39:11 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180422T000000, start_date=20221111T003909, end_date=20221111T003911 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:11.841149Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a39a344c-aef9-48ee-87b5-afa78f9aec0f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..5b12fe8d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:03.776828Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d1247f2-ce9c-489f-92eb-5897f9456183"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:03.776828+00:00, try_number=1, job_id=368, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-22 00:00:00+00:00 +INFO - Started process 2799 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-22T00:00:00+00:00', '--job-id', '368', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm6gahj5q'] +INFO - Job 368: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180422T000000, start_date=20221111T003903, end_date=20221111T003912 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:12.221606Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d1247f2-ce9c-489f-92eb-5897f9456183"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3fad4fef --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:03.618803Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "936ce988-5917-314e-a5e0-89548b8ad721"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a763eac8-1ad5-4a7b-85e8-9ed4e0897632"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:03.618803+00:00, try_number=1, job_id=367, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-22 00:00:00+00:00 +INFO - Started process 2790 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-22T00:00:00+00:00', '--job-id', '367', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqpyd39wu'] +INFO - Job 367: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180422T000000, start_date=20221111T003903, end_date=20221111T003907 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:07.090995Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a763eac8-1ad5-4a7b-85e8-9ed4e0897632"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..94b12cdf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:39:18.698653Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26c94078-5859-4abe-9500-084dfd084b9f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:18.698653+00:00, try_number=1, job_id=372, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-23 00:00:00+00:00 +INFO - Started process 2922 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-23T00:00:00+00:00', '--job-id', '372', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx3id5fq5'] +INFO - Job 372: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180423T000000, start_date=20221111T003918, end_date=20221111T003921 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:21.490152Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26c94078-5859-4abe-9500-084dfd084b9f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6b08da26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:39:18.697068Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f027d79-ee2c-47d2-8d65-b813a9810b01"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:18.697068+00:00, try_number=1, job_id=371, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-23 00:00:00+00:00 +INFO - Started process 2924 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-23T00:00:00+00:00', '--job-id', '371', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpffezty1k'] +INFO - Job 371: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180423T000000, start_date=20221111T003918, end_date=20221111T003921 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:21.488788Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f027d79-ee2c-47d2-8d65-b813a9810b01"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..fc4c4eec --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:31.425561Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e6693adb-f85b-48da-884a-77494a19f9c0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:31.425561+00:00, try_number=1, job_id=376, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-23 00:00:00+00:00 +INFO - Started process 2871 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-23T00:00:00+00:00', '--job-id', '376', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuqaqkhmt'] +INFO - Job 376: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'kjH8CpgFcp69EI+lSWvd2w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:kjH8CpgFcp69EI+lSWvd2w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003932Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003932Z +20221111/us-east-1/s3/aws4_request +a00a39d7cde1fb2164f27d49371ee366af132a1e63dc97be7cf29a5ff617d813 +INFO - '2022-11-11' - botocore.auth - Signature: +bf43b60c24c9013d36aba49634bfbd9b2f3bbdd68fb8b70ea75fca633784248f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'fE0OhNT1CoGION4DU6qPiWIzp4cFrnWcMx5pYLZ8BuOCys3EgyP7vCzUWVNo/ZtMzPcnHyFQEcM=', 'x-amz-request-id': 'G6VMFXTDME5BNMN8', 'Date': 'Fri, 11 Nov 2022 00:39:32 GMT', 'ETag': '"9231fc0a9805729ebd108fa5496bdddb"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180423T000000, start_date=20221111T003931, end_date=20221111T003933 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:33.248358Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e6693adb-f85b-48da-884a-77494a19f9c0"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..ad357cb8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:28.081120Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e287610-e774-4004-aa64-3115b58f31af"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:28.081120+00:00, try_number=1, job_id=375, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-23 00:00:00+00:00 +INFO - Started process 2863 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-23T00:00:00+00:00', '--job-id', '375', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_bsddqjz'] +INFO - Job 375: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003928Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003928Z +20221111/us-east-1/s3/aws4_request +93305ad71274f2400c23d78037979b79c0936014d1995b32540497190e96a676 +INFO - '2022-11-11' - botocore.auth - Signature: +bb6a8a1e8ae4ed3280f8ac9d792d684b5f9aa09f266dd97592b50ff51d2e2071 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'SnumUk8uvxJyVMQQ3hPkJ9mUi1qGE5KfCvE8DJNlWSEjYeKudmcbEr8NLXZO1OBN8SC7VL1qUnY=', 'x-amz-request-id': '4XSYRB1HWABW2MX3', 'Date': 'Fri, 11 Nov 2022 00:39:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180423T000000, start_date=20221111T003928, end_date=20221111T003930 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:30.141358Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e287610-e774-4004-aa64-3115b58f31af"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..358994f0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:23.319590Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99ef3844-4b84-43ec-b25c-325908e851a7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:23.319590+00:00, try_number=1, job_id=374, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-23 00:00:00+00:00 +INFO - Started process 2858 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-23T00:00:00+00:00', '--job-id', '374', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplwzv9nmm'] +INFO - Job 374: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180423T000000, start_date=20221111T003923, end_date=20221111T003929 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:29.095454Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99ef3844-4b84-43ec-b25c-325908e851a7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..d4352940 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:23.136261Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e3917dfa-cd30-356b-b3df-6ffd5344b3d5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45c0dbd9-5f2e-459e-83be-2dabfa53b926"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:23.136261+00:00, try_number=1, job_id=373, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-23 00:00:00+00:00 +INFO - Started process 2856 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-23T00:00:00+00:00', '--job-id', '373', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4gf39_7i'] +INFO - Job 373: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180423T000000, start_date=20221111T003923, end_date=20221111T003925 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:25.773262Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45c0dbd9-5f2e-459e-83be-2dabfa53b926"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f693c515 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:39:36.023774Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d43f58c9-39b4-4f7d-a5b9-87220fe04248"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:36.023774+00:00, try_number=1, job_id=378, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-24 00:00:00+00:00 +INFO - Started process 2922 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-24T00:00:00+00:00', '--job-id', '378', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo7x5rqqs'] +INFO - Job 378: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180424T000000, start_date=20221111T003936, end_date=20221111T003938 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:38.994256Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d43f58c9-39b4-4f7d-a5b9-87220fe04248"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bc6802c5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:39:36.020081Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1fcdb416-f266-4291-8d9c-e87d1a82c936"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:36.020081+00:00, try_number=1, job_id=377, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-24 00:00:00+00:00 +INFO - Started process 2921 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-24T00:00:00+00:00', '--job-id', '377', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwlnxjkmm'] +INFO - Job 377: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180424T000000, start_date=20221111T003936, end_date=20221111T003939 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:39.048546Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1fcdb416-f266-4291-8d9c-e87d1a82c936"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..8565464c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:48.750207Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49426115-b385-4e17-98bd-026805375350"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:48.750207+00:00, try_number=1, job_id=382, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-24 00:00:00+00:00 +INFO - Started process 3005 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-24T00:00:00+00:00', '--job-id', '382', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2ovyaxxp'] +INFO - Job 382: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '1xskdkruI+0lk13rDwWtqA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:1xskdkruI+0lk13rDwWtqA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003949Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003949Z +20221111/us-east-1/s3/aws4_request +961dd833ae5c7ba8ebc6ea0d4a8d3fbaa3acc448a78b55b74b5f279f80212575 +INFO - '2022-11-11' - botocore.auth - Signature: +ccdb01d7792943a4143f81772f562bbb4b20bb2ae3337635438212775431d675 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'zdCixmhjDNZCQeEAtO5Ff+9IcSOYrbswtTqyA4XrsUlNDF41RtsJJOARKOAPVUAbcXzcbZ9oKWE=', 'x-amz-request-id': '4TV9S2PH6Q39B600', 'Date': 'Fri, 11 Nov 2022 00:39:49 GMT', 'ETag': '"d71b24764aee23ed25935deb0f05ada8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180424T000000, start_date=20221111T003948, end_date=20221111T003950 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:50.596022Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49426115-b385-4e17-98bd-026805375350"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..2a3d2fbc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:45.956554Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "add5a7d9-49a0-45ff-bbe4-bad8a9d83d6c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:45.956554+00:00, try_number=1, job_id=381, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-24 00:00:00+00:00 +INFO - Started process 2951 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-24T00:00:00+00:00', '--job-id', '381', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpswpmwks1'] +INFO - Job 381: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T003947Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T003947Z +20221111/us-east-1/s3/aws4_request +b1252c059e986d773042ad6422525102b53059cabe266e9a102cc079e0359191 +INFO - '2022-11-11' - botocore.auth - Signature: +78a9e67f517f7725f80a183a86eede386cda1a9e0bb130ed9f1353dca36532dd +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'B7yl6gyshKuCm0wNHTgbm+yFnA5osZL7ePm7u45ElzYu1qomkrF+pm5Y8badM0iDM0/IzLAyjJQ=', 'x-amz-request-id': 'VJ4FPNVX1A9XKCVS', 'Date': 'Fri, 11 Nov 2022 00:39:47 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180424T000000, start_date=20221111T003945, end_date=20221111T003948 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:48.451424Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "add5a7d9-49a0-45ff-bbe4-bad8a9d83d6c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..86533c44 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:40.946968Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd37a571-1b80-4cd8-974a-94c63d0ed061"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:40.946968+00:00, try_number=1, job_id=379, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-24 00:00:00+00:00 +INFO - Started process 2973 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-24T00:00:00+00:00', '--job-id', '379', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmpp1tt6d'] +INFO - Job 379: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180424T000000, start_date=20221111T003940, end_date=20221111T003947 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:47.275740Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd37a571-1b80-4cd8-974a-94c63d0ed061"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..443ab48a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:40.971819Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cb7d7689-264b-3f37-b69c-0f8b8b39b5dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "14fc0bb5-fdea-478f-b9d5-da24466370f8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:40.971819+00:00, try_number=1, job_id=380, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-24 00:00:00+00:00 +INFO - Started process 2974 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-24T00:00:00+00:00', '--job-id', '380', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdm1ja6d8'] +INFO - Job 380: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180424T000000, start_date=20221111T003940, end_date=20221111T003943 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:43.857505Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "14fc0bb5-fdea-478f-b9d5-da24466370f8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..310f34ba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:39:53.290698Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d051733-b268-4349-9efa-9c4e732d13d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:53.290698+00:00, try_number=1, job_id=384, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-25 00:00:00+00:00 +INFO - Started process 3021 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-25T00:00:00+00:00', '--job-id', '384', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphtmyqjgz'] +INFO - Job 384: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180425T000000, start_date=20221111T003953, end_date=20221111T003956 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:56.553023Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d051733-b268-4349-9efa-9c4e732d13d6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..304dbe18 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:39:52.826139Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d712a567-0364-4e7e-8b4a-ca61c3314456"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:52.826139+00:00, try_number=1, job_id=383, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-25 00:00:00+00:00 +INFO - Started process 3018 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-25T00:00:00+00:00', '--job-id', '383', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwia2napf'] +INFO - Job 383: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180425T000000, start_date=20221111T003952, end_date=20221111T003956 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:39:56.006666Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d712a567-0364-4e7e-8b4a-ca61c3314456"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4c092b89 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:13.718881Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b2993d38-b19f-4c52-97f0-9943e6b53381"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:13.718881+00:00, try_number=1, job_id=388, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-25 00:00:00+00:00 +INFO - Started process 3039 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-25T00:00:00+00:00', '--job-id', '388', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm1b727yl'] +INFO - Job 388: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '1xskdkruI+0lk13rDwWtqA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:1xskdkruI+0lk13rDwWtqA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004015Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004015Z +20221111/us-east-1/s3/aws4_request +ab8bcc7ce298e0a7e64123adc6761e59138eb62d05a4dde21310f6d1945bab5c +INFO - '2022-11-11' - botocore.auth - Signature: +0e9bd99059575768048665d2cb65498ece9e0cf14ff67a85ef4c17649f5f60ed +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '9LrA2aMu/yf3WFINMRcNvrjgpJALFNDVgfJbhTqiZqWVbCcxZ5xBSKcfAANIYwXrXINmPAK726k=', 'x-amz-request-id': '2AXH7SW3KNN2VPR2', 'Date': 'Fri, 11 Nov 2022 00:40:15 GMT', 'ETag': '"d71b24764aee23ed25935deb0f05ada8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180425T000000, start_date=20221111T004013, end_date=20221111T004016 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:16.760369Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b2993d38-b19f-4c52-97f0-9943e6b53381"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b1699c1a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:04.077367Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "18013a99-99bd-4f0d-9d6f-51c1bcef7168"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:04.077367+00:00, try_number=1, job_id=387, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-25 00:00:00+00:00 +INFO - Started process 3032 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-25T00:00:00+00:00', '--job-id', '387', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy_em3kdq'] +INFO - Job 387: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50083a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004006Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004006Z +20221111/us-east-1/s3/aws4_request +fb18b42c0b8c8879f1a43822af9897cb40921a3cf0bcca060d734d857fb16f32 +INFO - '2022-11-11' - botocore.auth - Signature: +b7c5ff279489e115451f8b3e20bea58e1942880e40442326fe545385403b46e5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '9PaHhyY83zRxFZkgnjlLsF8TdXG2fRvwUyQLzjoMWK3RD3wxE2CKsPosyaUbnzTWb6h1ArYZPSuLy5kmUOwd7w==', 'x-amz-request-id': 'KC5V5APBE49TYE5A', 'Date': 'Fri, 11 Nov 2022 00:40:06 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180425T000000, start_date=20221111T004004, end_date=20221111T004007 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:07.566905Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "18013a99-99bd-4f0d-9d6f-51c1bcef7168"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..cc3e80ed --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:59.669567Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f55e0d95-9dc1-48e2-83f2-b1246930a18a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:59.669567+00:00, try_number=1, job_id=386, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-25 00:00:00+00:00 +INFO - Started process 2960 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-25T00:00:00+00:00', '--job-id', '386', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg5z7z4if'] +INFO - Job 386: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180425T000000, start_date=20221111T003959, end_date=20221111T004010 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:10.865471Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f55e0d95-9dc1-48e2-83f2-b1246930a18a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..4613086d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:39:57.945995Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "726d7602-0fe4-3252-a711-034ec0d5376c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ef9ebd19-6be5-4169-bda1-916b283dd1ca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:39:57.945995+00:00, try_number=1, job_id=385, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-25 00:00:00+00:00 +INFO - Started process 3027 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-25T00:00:00+00:00', '--job-id', '385', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn_37cq6x'] +INFO - Job 385: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180425T000000, start_date=20221111T003957, end_date=20221111T004001 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:01.136193Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ef9ebd19-6be5-4169-bda1-916b283dd1ca"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..a1a49222 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:40:20.443447Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c8ed0ee-ede4-4147-8be9-20673115f2a4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:20.443447+00:00, try_number=1, job_id=389, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-26 00:00:00+00:00 +INFO - Started process 3021 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-26T00:00:00+00:00', '--job-id', '389', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw962kc37'] +INFO - Job 389: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180426T000000, start_date=20221111T004020, end_date=20221111T004023 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:23.513312Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c8ed0ee-ede4-4147-8be9-20673115f2a4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..19105ce1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:40:20.571627Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c8dc6b51-3b2f-4415-9f4f-2d374392e8c7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:20.571627+00:00, try_number=1, job_id=390, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-26 00:00:00+00:00 +INFO - Started process 3024 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-26T00:00:00+00:00', '--job-id', '390', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgof71jai'] +INFO - Job 390: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180426T000000, start_date=20221111T004020, end_date=20221111T004023 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:23.506386Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c8dc6b51-3b2f-4415-9f4f-2d374392e8c7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4f5ea0ca --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:37.424011Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ba6989fc-3cea-4c34-9d77-051e6d37f739"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:37.424011+00:00, try_number=1, job_id=394, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-26 00:00:00+00:00 +INFO - Started process 3083 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-26T00:00:00+00:00', '--job-id', '394', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppdanivfn'] +INFO - Job 394: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'f5nASCegarfvSBHZ4HIH7A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:f5nASCegarfvSBHZ4HIH7A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004038Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004038Z +20221111/us-east-1/s3/aws4_request +87305d012dfcb62317347d32731a465d1c75e8dd08b04a0c8fc701e49be1f180 +INFO - '2022-11-11' - botocore.auth - Signature: +53d40b2f0c4ea59a278a73acbf0490579ef95b7329ccd1f4dfc309bee31c3808 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Puk5gCSD7JZoztme8DLPGHfPTQQK3s2I8jik7QNSK5jm8anuyVuYXIC+uQHsFIFvHcbXIE/d7I8=', 'x-amz-request-id': 'YR003942RAKBGWFW', 'Date': 'Fri, 11 Nov 2022 00:40:38 GMT', 'ETag': '"7f99c04827a06ab7ef4811d9e07207ec"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180426T000000, start_date=20221111T004037, end_date=20221111T004039 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:39.374067Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ba6989fc-3cea-4c34-9d77-051e6d37f739"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..39fc3ea3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:32.870963Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3491ec6f-1889-4177-956b-11a74d3a12af"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:32.870963+00:00, try_number=1, job_id=393, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-26 00:00:00+00:00 +INFO - Started process 3120 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-26T00:00:00+00:00', '--job-id', '393', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprvaa1d9n'] +INFO - Job 393: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50041f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004034Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004034Z +20221111/us-east-1/s3/aws4_request +b79cf31234a1fd439f1e94efcbf39b40c8636203ed0e7d8efc6cc5c090dfdb9c +INFO - '2022-11-11' - botocore.auth - Signature: +f9d1eb4a08f13e4e4e9545753fc1f36b5b42cd86255b3f7d21520b7f0edb7a68 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'fKSpVTDiIE+BoViUD3rVds1D49lr5xzrNag2sz/Gsrl24nCbx7rOtk4RfL7c0u3kx31dLNOsW/o=', 'x-amz-request-id': '3F0SV1WF61ECXAX5', 'Date': 'Fri, 11 Nov 2022 00:40:34 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180426T000000, start_date=20221111T004032, end_date=20221111T004035 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:35.705910Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3491ec6f-1889-4177-956b-11a74d3a12af"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..60ac45ba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:26.956866Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d85b7b18-ff08-4234-8ab8-8f1f851ddd95"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:26.956866+00:00, try_number=1, job_id=392, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-26 00:00:00+00:00 +INFO - Started process 3115 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-26T00:00:00+00:00', '--job-id', '392', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbsglozdf'] +INFO - Job 392: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180426T000000, start_date=20221111T004026, end_date=20221111T004034 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:34.957006Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d85b7b18-ff08-4234-8ab8-8f1f851ddd95"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e954b513 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:26.929116Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2d66295e-8553-302c-aed9-e5cc4d20410c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee5a2931-88c4-4301-84d3-fa6da5b3ad76"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:26.929116+00:00, try_number=1, job_id=391, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-26 00:00:00+00:00 +INFO - Started process 3114 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-26T00:00:00+00:00', '--job-id', '391', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcz142but'] +INFO - Job 391: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180426T000000, start_date=20221111T004026, end_date=20221111T004030 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:30.079889Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee5a2931-88c4-4301-84d3-fa6da5b3ad76"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..49557cea --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:40:42.157901Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "490064cb-c193-4c8d-a2d5-62e93ae0c155"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:42.157901+00:00, try_number=1, job_id=395, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-27 00:00:00+00:00 +INFO - Started process 3130 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-27T00:00:00+00:00', '--job-id', '395', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo4wcl7z7'] +INFO - Job 395: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180427T000000, start_date=20221111T004042, end_date=20221111T004045 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:45.066278Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "490064cb-c193-4c8d-a2d5-62e93ae0c155"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..47fe033b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:40:42.184177Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e08b685e-5d56-4b54-810a-7686b63305fa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:42.184177+00:00, try_number=1, job_id=396, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-27 00:00:00+00:00 +INFO - Started process 3132 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-27T00:00:00+00:00', '--job-id', '396', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8eupdc7n'] +INFO - Job 396: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180427T000000, start_date=20221111T004042, end_date=20221111T004045 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:45.109916Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e08b685e-5d56-4b54-810a-7686b63305fa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..591357a0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:55.772560Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "61d04a29-6345-4f3d-b886-a827beffc7d4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:55.772560+00:00, try_number=1, job_id=400, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-27 00:00:00+00:00 +INFO - Started process 3102 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-27T00:00:00+00:00', '--job-id', '400', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwysr7q_l'] +INFO - Job 400: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'lhZMlf+6PsR3aKThiNRMqQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:lhZMlf+6PsR3aKThiNRMqQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004056Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004056Z +20221111/us-east-1/s3/aws4_request +4f0fb9a4a1d640680ac2e3154d7be7fd1821a6579454992f59eb957d70621b56 +INFO - '2022-11-11' - botocore.auth - Signature: +eb3c86c74b340cd39a7d5039b82c990a97c458a4d033c13bd50b4b0c913bec5d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8/bXtB8Ovd9uRHTiNDGyyD9BHiakAxa8k42Xu8xd/kieCZFN9rSqT53u+rZ1HNEjO9CCU9rDo+k=', 'x-amz-request-id': 'PCWSHRBS45F6QXW5', 'Date': 'Fri, 11 Nov 2022 00:40:56 GMT', 'ETag': '"96164c95ffba3ec47768a4e188d44ca9"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180427T000000, start_date=20221111T004055, end_date=20221111T004057 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:57.595578Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "61d04a29-6345-4f3d-b886-a827beffc7d4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c8eae377 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:52.417250Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ec2469ce-0544-42f0-a807-a5aa6c4c964b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:52.417250+00:00, try_number=1, job_id=399, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-27 00:00:00+00:00 +INFO - Started process 3203 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-27T00:00:00+00:00', '--job-id', '399', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbgdu7yq5'] +INFO - Job 399: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50043a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004053Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004053Z +20221111/us-east-1/s3/aws4_request +64ad42fa9f3a39b6e251f8cc6be4189872513307e7c89dda6ec527915f36ece5 +INFO - '2022-11-11' - botocore.auth - Signature: +b57644342afd8f448fd1313a4ce331b778d25384e1a4a616d7d77b44ac980e3a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'aLod7ruSZAIt5r53EPt3GctmkC5BGv16eFmZom0D6XUqXudRUUj+ldWSDqiCYQi5OxRBsyGnOHc=', 'x-amz-request-id': 'MJXWDSMMMPF3XW30', 'Date': 'Fri, 11 Nov 2022 00:40:53 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180427T000000, start_date=20221111T004052, end_date=20221111T004054 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:54.476349Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ec2469ce-0544-42f0-a807-a5aa6c4c964b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..f0bd73a8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:47.270067Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c9adbc3b-6c73-4bfb-8631-23d5dd78e576"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:47.270067+00:00, try_number=1, job_id=398, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-27 00:00:00+00:00 +INFO - Started process 3095 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-27T00:00:00+00:00', '--job-id', '398', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptsl_79ti'] +INFO - Job 398: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180427T000000, start_date=20221111T004047, end_date=20221111T004054 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:54.042141Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c9adbc3b-6c73-4bfb-8631-23d5dd78e576"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..be810e1a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:40:47.268765Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c05cb8ba-1c0f-3ad5-ac74-bd2cffd53e21"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b60061b1-9965-4fd7-bf02-9328a7f856ac"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:47.268765+00:00, try_number=1, job_id=397, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-27 00:00:00+00:00 +INFO - Started process 3096 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-27T00:00:00+00:00', '--job-id', '397', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprn888o1b'] +INFO - Job 397: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180427T000000, start_date=20221111T004047, end_date=20221111T004050 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:40:50.160067Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b60061b1-9965-4fd7-bf02-9328a7f856ac"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..858b7ffd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:40:59.442596Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d15dc248-24fb-43a3-85b8-c524c0b1e9e3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:59.442596+00:00, try_number=1, job_id=401, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-28 00:00:00+00:00 +INFO - Started process 3212 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-28T00:00:00+00:00', '--job-id', '401', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfnete812'] +INFO - Job 401: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180428T000000, start_date=20221111T004059, end_date=20221111T004102 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:02.539433Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d15dc248-24fb-43a3-85b8-c524c0b1e9e3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..fec00bdb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:40:59.491742Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "24fc4bed-ea06-455f-99a0-785bc7514f85"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:40:59.491742+00:00, try_number=1, job_id=402, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-28 00:00:00+00:00 +INFO - Started process 3214 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-28T00:00:00+00:00', '--job-id', '402', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8j6yxqq_'] +INFO - Job 402: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180428T000000, start_date=20221111T004059, end_date=20221111T004102 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:02.578383Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "24fc4bed-ea06-455f-99a0-785bc7514f85"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e4a92dd8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:13.106796Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e26cb132-b7b6-43f5-8dad-a5d3d668fbef"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:13.106796+00:00, try_number=1, job_id=406, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-28 00:00:00+00:00 +INFO - Started process 3230 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-28T00:00:00+00:00', '--job-id', '406', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6xbl8as9'] +INFO - Job 406: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Onewa3j76dTOgiCgbPXaRQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Onewa3j76dTOgiCgbPXaRQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004113Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004113Z +20221111/us-east-1/s3/aws4_request +c54b760f15e659b15520580e3f6033906952cb6dd8a2b131ddbf865bcc799136 +INFO - '2022-11-11' - botocore.auth - Signature: +d45ed9fa61fb01b9feb414ae477f5ad1900bab48ade5b0e24304e95d7633add6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'u01EDkOCJ1/FmAuGUH5m4lc+GxxNGIZsRFPnCKLm9xRIfLNKODolVC+u3iLf/2DPJqMZ6m9lXbw=', 'x-amz-request-id': '93DBPHB3SGFZZ0M3', 'Date': 'Fri, 11 Nov 2022 00:41:14 GMT', 'ETag': '"3a77b06b78fbe9d4ce8220a06cf5da45"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180428T000000, start_date=20221111T004113, end_date=20221111T004115 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:15.016223Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e26cb132-b7b6-43f5-8dad-a5d3d668fbef"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..499f6486 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:10.179443Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "883c7830-b2f2-497e-b395-2ce9fcbc85bb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:10.179443+00:00, try_number=1, job_id=405, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-28 00:00:00+00:00 +INFO - Started process 3174 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-28T00:00:00+00:00', '--job-id', '405', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphvn32z21'] +INFO - Job 405: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004111Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004111Z +20221111/us-east-1/s3/aws4_request +098f3f1e784ae8e1c199d431e981a7a68a4b57240f726aeadedb8d731ca498d1 +INFO - '2022-11-11' - botocore.auth - Signature: +4d059b2a44990b949ca6dfa79098b66b56c5d7b39192f5b22a63fe9ef45d9e19 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BaY8vYwtA4PqqJvvHbcLZegZjRysci8xKQx1qxhj7iLQ0sIh6aAsRqKTqYlA5Mmfs0OAGfMCSKI=', 'x-amz-request-id': 'N4GJYQPHVWXPBGZ2', 'Date': 'Fri, 11 Nov 2022 00:41:11 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180428T000000, start_date=20221111T004110, end_date=20221111T004112 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:12.287064Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "883c7830-b2f2-497e-b395-2ce9fcbc85bb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..4959e96e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:04.416827Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "481f3ba1-39c4-4a52-b40a-5f1ba8806a1b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:04.416827+00:00, try_number=1, job_id=403, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-28 00:00:00+00:00 +INFO - Started process 3223 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-28T00:00:00+00:00', '--job-id', '403', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkh7xktvq'] +INFO - Job 403: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180428T000000, start_date=20221111T004104, end_date=20221111T004111 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:11.494920Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "481f3ba1-39c4-4a52-b40a-5f1ba8806a1b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f499ed5b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:04.437910Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d96397de-af6d-3f2e-ab46-a0ff4bccbd69"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab1f4903-279c-4b56-a343-9a9f94442b9b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:04.437910+00:00, try_number=1, job_id=404, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-28 00:00:00+00:00 +INFO - Started process 3224 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-28T00:00:00+00:00', '--job-id', '404', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0blscdml'] +INFO - Job 404: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180428T000000, start_date=20221111T004104, end_date=20221111T004107 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:07.560888Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab1f4903-279c-4b56-a343-9a9f94442b9b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ada205ea --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:41:17.245662Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea38b968-a899-46c5-b858-a906c1f584d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:17.245662+00:00, try_number=1, job_id=407, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-29 00:00:00+00:00 +INFO - Started process 3184 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-29T00:00:00+00:00', '--job-id', '407', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp712ofx4b'] +INFO - Job 407: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180429T000000, start_date=20221111T004117, end_date=20221111T004119 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:19.990816Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea38b968-a899-46c5-b858-a906c1f584d6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b99693cc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:41:17.246495Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f46ee1a4-06bc-431b-91ea-1c8924ad70bb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:17.246495+00:00, try_number=1, job_id=408, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-29 00:00:00+00:00 +INFO - Started process 3185 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-29T00:00:00+00:00', '--job-id', '408', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy5szq2lz'] +INFO - Job 408: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180429T000000, start_date=20221111T004117, end_date=20221111T004120 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:20.143816Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f46ee1a4-06bc-431b-91ea-1c8924ad70bb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..fe7af74d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:29.993489Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65850bbb-c2ae-429c-b5c8-48e3ee603204"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:29.993489+00:00, try_number=1, job_id=412, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-29 00:00:00+00:00 +INFO - Started process 3319 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-29T00:00:00+00:00', '--job-id', '412', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfko9mr05'] +INFO - Job 412: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Db7gB+JznlLrMVIe1RAxdw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Db7gB+JznlLrMVIe1RAxdw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004130Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004130Z +20221111/us-east-1/s3/aws4_request +d169bdfcd4c67c8582828bd426fdcfb1cfbbabe2ba54430ee42a9572a04a9a65 +INFO - '2022-11-11' - botocore.auth - Signature: +4afc4f4de0b3e8516387f3b42dd48083e5ae716335b5111e4cc5a7767836aa14 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'IowwfaRkuRCszfSZDlBRQgNBMYyUZt4SWHIIbE7YcR0YR8lDtzPn1dnmPsxNUB1YhV9vwnArIV8=', 'x-amz-request-id': '5SZH33CN9ZGZW1RV', 'Date': 'Fri, 11 Nov 2022 00:41:31 GMT', 'ETag': '"0dbee007e2739e52eb31521ed5103177"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180429T000000, start_date=20221111T004129, end_date=20221111T004131 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:31.726131Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65850bbb-c2ae-429c-b5c8-48e3ee603204"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..58dfca7c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:27.569571Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26038f19-d562-4f7b-95a3-911dcf851c02"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:27.569571+00:00, try_number=1, job_id=411, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-29 00:00:00+00:00 +INFO - Started process 3311 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-29T00:00:00+00:00', '--job-id', '411', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzxhf_pjy'] +INFO - Job 411: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50073a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004128Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004128Z +20221111/us-east-1/s3/aws4_request +337409469734850e81b8ad54dfbdbf259607ef11f6ac6dbe30efcb473dd4e467 +INFO - '2022-11-11' - botocore.auth - Signature: +c87095c8d16e777e922a3931e99a55c47be7f6164d3b9fb12f6d05fb32bc9349 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'tk0WYXb+CnQT1RKISm5iQ8t/j8/mrEyh870NaxTXnHBd3+qOyiUcqDwZKD78UjU10kLephKQh3o=', 'x-amz-request-id': 'RPQ29K64BBKQT5VD', 'Date': 'Fri, 11 Nov 2022 00:41:28 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180429T000000, start_date=20221111T004127, end_date=20221111T004129 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:29.411731Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26038f19-d562-4f7b-95a3-911dcf851c02"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..80e2606c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:22.691663Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "15ccfd52-d55a-4da9-ba6e-7a7668fa5701"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:22.691663+00:00, try_number=1, job_id=409, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-29 00:00:00+00:00 +INFO - Started process 3302 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-29T00:00:00+00:00', '--job-id', '409', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo8iycs1s'] +INFO - Job 409: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180429T000000, start_date=20221111T004122, end_date=20221111T004128 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:28.289172Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "15ccfd52-d55a-4da9-ba6e-7a7668fa5701"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e9b77307 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:22.699551Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5d11244d-145f-3804-982f-15afde707fef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "779f01fc-a7b5-418a-835b-9f5e3f4b5a0e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:22.699551+00:00, try_number=1, job_id=410, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-29 00:00:00+00:00 +INFO - Started process 3306 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-29T00:00:00+00:00', '--job-id', '410', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8a0cjlcu'] +INFO - Job 410: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180429T000000, start_date=20221111T004122, end_date=20221111T004125 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:25.448787Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "779f01fc-a7b5-418a-835b-9f5e3f4b5a0e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..8d46c4db --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:41:33.833557Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f88410e-38c2-4719-b5a2-86fb1aecd86e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-04-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:33.833557+00:00, try_number=1, job_id=413, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-30 00:00:00+00:00 +INFO - Started process 3195 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-04-30T00:00:00+00:00', '--job-id', '413', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgf93pq4z'] +INFO - Job 413: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180430T000000, start_date=20221111T004133, end_date=20221111T004136 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:36.480200Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f88410e-38c2-4719-b5a2-86fb1aecd86e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6488faa2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:41:33.837883Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8af7dc6c-91f4-435e-9570-6a0c67cedff6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-04-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:33.837883+00:00, try_number=1, job_id=414, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-30 00:00:00+00:00 +INFO - Started process 3193 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-04-30T00:00:00+00:00', '--job-id', '414', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyh3u13iq'] +INFO - Job 414: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180430T000000, start_date=20221111T004133, end_date=20221111T004136 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:36.480200Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8af7dc6c-91f4-435e-9570-6a0c67cedff6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f0c7d64a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:45.725886Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6bf2b309-2d4c-4bd1-9053-96026c980e1b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-04-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:45.725886+00:00, try_number=1, job_id=418, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-30 00:00:00+00:00 +INFO - Started process 3332 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-04-30T00:00:00+00:00', '--job-id', '418', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprl19c3b7'] +INFO - Job 418: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Db7gB+JznlLrMVIe1RAxdw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Db7gB+JznlLrMVIe1RAxdw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004146Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004146Z +20221111/us-east-1/s3/aws4_request +1c8fc7f1ab2b4857f8e0361c071f28d9ffea28411b9d8c6a0a85ac87552c23c4 +INFO - '2022-11-11' - botocore.auth - Signature: +0aed5220d2a0939672dbe1cb4690451a2770ab7d0ba13ea2c37a65bf1bdf09c5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '2MJmMdUdI3+WeOLnBVz9WQfoJuIoyWZ3/xuXJe4XC0m6+ZA8R5JiCCSX+1w1uWCvUFmc0F/yHdk=', 'x-amz-request-id': '57CNXJ2464SJ8RSB', 'Date': 'Fri, 11 Nov 2022 00:41:46 GMT', 'ETag': '"0dbee007e2739e52eb31521ed5103177"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180430T000000, start_date=20221111T004145, end_date=20221111T004147 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:47.581263Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6bf2b309-2d4c-4bd1-9053-96026c980e1b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..40361a6d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:43.731989Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea7f5fcc-7ec4-4667-8c60-714b3006d7c2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-04-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:43.731989+00:00, try_number=1, job_id=417, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-30 00:00:00+00:00 +INFO - Started process 3326 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-04-30T00:00:00+00:00', '--job-id', '417', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpiffqg72e'] +INFO - Job 417: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004144Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004144Z +20221111/us-east-1/s3/aws4_request +97e3814cbbb1460eae219960c1396d1241ea8641b9b4e7dc7a47f67c9b1f5ab4 +INFO - '2022-11-11' - botocore.auth - Signature: +88617632a0dc7da932fce121ef7aa5ffd1bb69e0eefbf651c56c5c01c0e09232 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Nn12EQQXqxJk65j8jEQbEX9rFjjHssyir2VV7ylb+sf4HXSFEP8qHi56Y1gu9mrwOxUeKmiqG0E=', 'x-amz-request-id': '172CKBTG40551348', 'Date': 'Fri, 11 Nov 2022 00:41:45 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180430T000000, start_date=20221111T004143, end_date=20221111T004145 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:45.826462Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea7f5fcc-7ec4-4667-8c60-714b3006d7c2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e408c989 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:38.964814Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "369b57b2-a27b-4523-8f54-78ff1be69940"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-04-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:38.964814+00:00, try_number=1, job_id=415, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-30 00:00:00+00:00 +INFO - Started process 3245 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-04-30T00:00:00+00:00', '--job-id', '415', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt5jj8n3j'] +INFO - Job 415: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180430T000000, start_date=20221111T004138, end_date=20221111T004144 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:44.171565Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "369b57b2-a27b-4523-8f54-78ff1be69940"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..4f2c4f36 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-04-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:39.111415Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-04-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f86a48d3-5241-3b37-95f4-011011410112"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb7bf285-c3d3-48d1-84a9-90ce825fa248"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-04-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:39.111415+00:00, try_number=1, job_id=416, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-04-30 00:00:00+00:00 +INFO - Started process 3256 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-04-30T00:00:00+00:00', '--job-id', '416', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbt85czh4'] +INFO - Job 416: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-04-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180430T000000, start_date=20221111T004139, end_date=20221111T004142 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-04-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:42.058327Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb7bf285-c3d3-48d1-84a9-90ce825fa248"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..01301192 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:41:49.144751Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85af6000-4c11-4759-b17f-e96c286ecba2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:49.144751+00:00, try_number=1, job_id=419, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-01 00:00:00+00:00 +INFO - Started process 3342 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-01T00:00:00+00:00', '--job-id', '419', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp17bj0nli'] +INFO - Job 419: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180501T000000, start_date=20221111T004149, end_date=20221111T004151 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:51.895921Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85af6000-4c11-4759-b17f-e96c286ecba2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..0fb31242 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:41:49.149671Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7727708e-d49a-4310-a36c-c65cd2cb04d5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:49.149671+00:00, try_number=1, job_id=420, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-01 00:00:00+00:00 +INFO - Started process 3344 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-01T00:00:00+00:00', '--job-id', '420', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0dbnso0a'] +INFO - Job 420: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180501T000000, start_date=20221111T004149, end_date=20221111T004151 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:51.898975Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7727708e-d49a-4310-a36c-c65cd2cb04d5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..214c3618 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:01.075219Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4adb2fd9-50bf-479e-8321-895a48701d65"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:01.075219+00:00, try_number=1, job_id=424, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-01 00:00:00+00:00 +INFO - Started process 3293 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-01T00:00:00+00:00', '--job-id', '424', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp90xrkrhv'] +INFO - Job 424: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'edN8klDxhabm3w4tCefbpQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:edN8klDxhabm3w4tCefbpQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004201Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004201Z +20221111/us-east-1/s3/aws4_request +9fe2ce871bd327fc52db59e1002e8aea8d70c2a30b38d9420046c0aaa9391463 +INFO - '2022-11-11' - botocore.auth - Signature: +0172012899eeb71968c5b506d042023673434044bae2dab800116f9ea088d7ee +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'nN6FQMTZcishD7kEiKkdJDn3zNSiTJttxzTvZFh+tOcfy/bswL2OBn3mudFru+Hk6twovn1Er3A=', 'x-amz-request-id': 'DKPTD8A57HJDX8WE', 'Date': 'Fri, 11 Nov 2022 00:42:02 GMT', 'ETag': '"79d37c9250f185a6e6df0e2d09e7dba5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180501T000000, start_date=20221111T004201, end_date=20221111T004202 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:02.803123Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4adb2fd9-50bf-479e-8321-895a48701d65"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..af4a8d99 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:58.494164Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ccf9f06d-332e-429f-b6f4-00860ba7cf45"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:58.494164+00:00, try_number=1, job_id=423, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-01 00:00:00+00:00 +INFO - Started process 3285 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-01T00:00:00+00:00', '--job-id', '423', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnh67ch45'] +INFO - Job 423: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004159Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004159Z +20221111/us-east-1/s3/aws4_request +a520ae6ace6961a3763101007c5363db069f32e9ab608253999cd7eace28f6cc +INFO - '2022-11-11' - botocore.auth - Signature: +9f10b80801328b38620d10923f7ca2fd4ccb8b3171a73fc62cf433ba383b282c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'R6JVYO/m4HCHNQXZzcC8OHHHSh1A8JpVvhVSm9nxmWjVk328Pug4MdAGMV0pD4LXk5VRkIKJazg=', 'x-amz-request-id': '7VVJX99EMPFKEG8C', 'Date': 'Fri, 11 Nov 2022 00:41:59 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180501T000000, start_date=20221111T004158, end_date=20221111T004200 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:00.620492Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ccf9f06d-332e-429f-b6f4-00860ba7cf45"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..942cd679 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:54.312672Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a60cebef-70b5-4cd6-9de4-c58f18aa7bc2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:54.312672+00:00, try_number=1, job_id=422, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-01 00:00:00+00:00 +INFO - Started process 3280 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-01T00:00:00+00:00', '--job-id', '422', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptimi3qt9'] +INFO - Job 422: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180501T000000, start_date=20221111T004154, end_date=20221111T004159 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:59.509324Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a60cebef-70b5-4cd6-9de4-c58f18aa7bc2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..5ae43243 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:41:54.309804Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "42e35f3d-90b7-3fb4-97d0-f40f9597176d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab498810-d96c-4b55-97f4-8c22be35fa04"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:41:54.309804+00:00, try_number=1, job_id=421, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-01 00:00:00+00:00 +INFO - Started process 3279 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-01T00:00:00+00:00', '--job-id', '421', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjrvi2d3q'] +INFO - Job 421: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180501T000000, start_date=20221111T004154, end_date=20221111T004156 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:41:56.923642Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab498810-d96c-4b55-97f4-8c22be35fa04"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..17099fc0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:04.660870Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "78aa8a5c-22f5-497d-82fa-443f6d22c1f2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:04.660870+00:00, try_number=1, job_id=426, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-02 00:00:00+00:00 +INFO - Started process 3304 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-02T00:00:00+00:00', '--job-id', '426', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzxsccvac'] +INFO - Job 426: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180502T000000, start_date=20221111T004204, end_date=20221111T004207 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:07.493816Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "78aa8a5c-22f5-497d-82fa-443f6d22c1f2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6a83ca03 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:04.597380Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5459c17b-c824-41c5-9e3d-d42226be33f6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:04.597380+00:00, try_number=1, job_id=425, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-02 00:00:00+00:00 +INFO - Started process 3302 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-02T00:00:00+00:00', '--job-id', '425', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx8hubvfz'] +INFO - Job 425: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180502T000000, start_date=20221111T004204, end_date=20221111T004207 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:07.482198Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5459c17b-c824-41c5-9e3d-d42226be33f6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..6a6bcbf9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:16.691725Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eec99e55-4276-4e0d-a49c-268d2a7a06f4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:16.691725+00:00, try_number=1, job_id=430, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-02 00:00:00+00:00 +INFO - Started process 3415 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-02T00:00:00+00:00', '--job-id', '430', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpehl4i5v4'] +INFO - Job 430: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa3940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Db7gB+JznlLrMVIe1RAxdw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Db7gB+JznlLrMVIe1RAxdw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004217Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004217Z +20221111/us-east-1/s3/aws4_request +5e59b83ff9be8b3a097b09724c79b0171151fada9b14cc737714e8f51a923c7e +INFO - '2022-11-11' - botocore.auth - Signature: +c8a8361ff84a98377ac4e9d62aaa218f67e9587c66435be46c6b20e49bcedd16 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'zDVi215AK0j54W+qtmH6wxGTmK4D0dR/hKVptgLDspGKhDgjIfbZUIv8yVcYYoTYhYbSX+/o5TQ=', 'x-amz-request-id': 'QKVNR9Z9G4EYZM1Z', 'Date': 'Fri, 11 Nov 2022 00:42:18 GMT', 'ETag': '"0dbee007e2739e52eb31521ed5103177"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180502T000000, start_date=20221111T004216, end_date=20221111T004218 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:18.740502Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eec99e55-4276-4e0d-a49c-268d2a7a06f4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..53b37789 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:13.807660Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26ed6efa-4ae9-46f6-a43f-e6e59be2882f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:13.807660+00:00, try_number=1, job_id=429, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-02 00:00:00+00:00 +INFO - Started process 3384 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-02T00:00:00+00:00', '--job-id', '429', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpigmoau6n'] +INFO - Job 429: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004214Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004214Z +20221111/us-east-1/s3/aws4_request +b5c61b3bde4ffb965d4d7663566d256aed8e516d7ef8d89763f47eb7509e5b8c +INFO - '2022-11-11' - botocore.auth - Signature: +e576267d3fed33a30d8bbb538c41e7d002d070c1b2653438e8ac0742c33c49b1 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'gDob5vmwQ32JXMY/vELwIc5jEyeqNHcNFSFvSAG1n0Z46NRLIEypIXsrhIKQmGszHTduSW2s5j8=', 'x-amz-request-id': '3CVQ9YEQJHXAS79E', 'Date': 'Fri, 11 Nov 2022 00:42:15 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180502T000000, start_date=20221111T004213, end_date=20221111T004215 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:15.730889Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26ed6efa-4ae9-46f6-a43f-e6e59be2882f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..2ae62298 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:09.217185Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1dc3cc83-e8e4-4b82-8519-2b1902ecf960"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:09.217185+00:00, try_number=1, job_id=428, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-02 00:00:00+00:00 +INFO - Started process 3352 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-02T00:00:00+00:00', '--job-id', '428', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxdbax24f'] +INFO - Job 428: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180502T000000, start_date=20221111T004209, end_date=20221111T004214 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:14.989911Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1dc3cc83-e8e4-4b82-8519-2b1902ecf960"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..d013423c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:09.181699Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b963c6c0-40e0-3469-80be-5eb0a67610ff"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "592ebba5-4870-4d90-9731-ddb33a34b03a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:09.181699+00:00, try_number=1, job_id=427, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-02 00:00:00+00:00 +INFO - Started process 3343 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-02T00:00:00+00:00', '--job-id', '427', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdzpbz43t'] +INFO - Job 427: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180502T000000, start_date=20221111T004209, end_date=20221111T004212 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:12.096719Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "592ebba5-4870-4d90-9731-ddb33a34b03a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..2293492c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:21.676946Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51d00a9d-8752-4a21-95b4-f779cac489b4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:21.676946+00:00, try_number=1, job_id=432, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-03 00:00:00+00:00 +INFO - Started process 3396 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-03T00:00:00+00:00', '--job-id', '432', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo70sstxu'] +INFO - Job 432: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180503T000000, start_date=20221111T004221, end_date=20221111T004224 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:24.786731Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51d00a9d-8752-4a21-95b4-f779cac489b4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..faa38227 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:21.646221Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d92b1d35-1dbe-4d17-b514-e8219b552c13"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:21.646221+00:00, try_number=1, job_id=431, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-03 00:00:00+00:00 +INFO - Started process 3393 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-03T00:00:00+00:00', '--job-id', '431', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp95uicmlj'] +INFO - Job 431: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180503T000000, start_date=20221111T004221, end_date=20221111T004224 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:24.715836Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d92b1d35-1dbe-4d17-b514-e8219b552c13"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..0de34655 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:33.103972Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "19b9dced-a809-43e1-b0bc-9d2ed368bc36"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:33.103972+00:00, try_number=1, job_id=436, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-03 00:00:00+00:00 +INFO - Started process 3418 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-03T00:00:00+00:00', '--job-id', '436', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp37tofav1'] +INFO - Job 436: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'X0b5ju38dOAbdh4DdGIB8w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:X0b5ju38dOAbdh4DdGIB8w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004234Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004234Z +20221111/us-east-1/s3/aws4_request +5b9a951c5425b8323c77b4dab72e2b80c8541cebb2bb20799acdec7e3f48666d +INFO - '2022-11-11' - botocore.auth - Signature: +b176901c746a5a6b73eb90bbce4aaca67b80a0583addf2a6eae658fca9798686 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'fa7cfUExAQJ3sR0ZHhN/oKrBlmfprlqjRoiafTxfUSxD6dpDPBgyXgG2ZKFhDDKP0aqnoo6YS0o=', 'x-amz-request-id': '8QNY4BMPX46J1AGQ', 'Date': 'Fri, 11 Nov 2022 00:42:34 GMT', 'ETag': '"5f46f98eedfc74e01b761e03746201f3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180503T000000, start_date=20221111T004233, end_date=20221111T004235 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:35.132817Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "19b9dced-a809-43e1-b0bc-9d2ed368bc36"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..101fb914 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:31.496166Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9deed52f-eb32-4637-8ed3-063bf6c1b39b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:31.496166+00:00, try_number=1, job_id=435, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-03 00:00:00+00:00 +INFO - Started process 3411 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-03T00:00:00+00:00', '--job-id', '435', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpid1fe4pt'] +INFO - Job 435: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004232Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004232Z +20221111/us-east-1/s3/aws4_request +21a3872f857628454ebd9d41d685fb0d0cd1525c2527226bf77aac8399a5d631 +INFO - '2022-11-11' - botocore.auth - Signature: +d7ee105a4fb483f82ef829b81f89e71f0a2b1bc8574078b480e18d6545a5d541 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'gKajdDBZa51dcTrd9dGPtlGDaynGKWIeIgPh137jdgP/cxS4RHqQcxurorVDgZKvS+VPh24AM4k=', 'x-amz-request-id': '1SP3GKFVSZMYGWJW', 'Date': 'Fri, 11 Nov 2022 00:42:32 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180503T000000, start_date=20221111T004231, end_date=20221111T004233 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:33.454841Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9deed52f-eb32-4637-8ed3-063bf6c1b39b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..51edf089 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:26.663792Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "054b84b4-07a3-4570-87a1-fa6a916c7d19"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:26.663792+00:00, try_number=1, job_id=434, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-03 00:00:00+00:00 +INFO - Started process 3406 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-03T00:00:00+00:00', '--job-id', '434', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpaprhm_a3'] +INFO - Job 434: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180503T000000, start_date=20221111T004226, end_date=20221111T004231 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:31.636570Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "054b84b4-07a3-4570-87a1-fa6a916c7d19"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..1220c8c4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:26.657942Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ba74c255-161c-3eff-aafb-fb4b71537fe4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5037c87b-d374-4a62-bb32-ea5a59139ec7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:26.657942+00:00, try_number=1, job_id=433, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-03 00:00:00+00:00 +INFO - Started process 3403 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-03T00:00:00+00:00', '--job-id', '433', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp47cv3qbm'] +INFO - Job 433: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180503T000000, start_date=20221111T004226, end_date=20221111T004229 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:29.346369Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5037c87b-d374-4a62-bb32-ea5a59139ec7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ef7779da --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:37.000347Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c469c2d4-eee9-4ced-a0c4-32a957169482"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:37.000347+00:00, try_number=1, job_id=437, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-04 00:00:00+00:00 +INFO - Started process 3489 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-04T00:00:00+00:00', '--job-id', '437', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0293kvvx'] +INFO - Job 437: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180504T000000, start_date=20221111T004237, end_date=20221111T004239 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:39.749378Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c469c2d4-eee9-4ced-a0c4-32a957169482"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..61824609 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:37.003254Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "022f8f38-5944-4848-a23a-978659cbe90a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:37.003254+00:00, try_number=1, job_id=438, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-04 00:00:00+00:00 +INFO - Started process 3491 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-04T00:00:00+00:00', '--job-id', '438', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfr5o5ko9'] +INFO - Job 438: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180504T000000, start_date=20221111T004237, end_date=20221111T004239 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:39.823320Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "022f8f38-5944-4848-a23a-978659cbe90a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..dcb1ecad --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:48.576113Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "05355e5c-3e24-4d70-ab89-fc54bf54dcd1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:48.576113+00:00, try_number=1, job_id=442, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-04 00:00:00+00:00 +INFO - Started process 3507 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-04T00:00:00+00:00', '--job-id', '442', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_rgf3416'] +INFO - Job 442: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'g+6Sjkgs4cZrORUP1qy+Jg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:g+6Sjkgs4cZrORUP1qy+Jg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004249Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004249Z +20221111/us-east-1/s3/aws4_request +0672dfab3b317d8c0ff90fdd11c80ae66c795a57b872ea67c15173ac6d2d2a8c +INFO - '2022-11-11' - botocore.auth - Signature: +0345a9f667f821bee118f440e077029965091c7786d1149273559c3b82851c81 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'dtB9gbrksgEA1j9C+iXHQ4H6YlZ+KzRjNa08fsHHwxGotLYyO2To/cQc0qZDFsV7zn8bOORBrfs=', 'x-amz-request-id': 'RKRF43WQGCZ5Y2MB', 'Date': 'Fri, 11 Nov 2022 00:42:49 GMT', 'ETag': '"83ee928e482ce1c66b39150fd6acbe26"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180504T000000, start_date=20221111T004248, end_date=20221111T004250 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:50.826200Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "05355e5c-3e24-4d70-ab89-fc54bf54dcd1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..ab643ac6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:46.844575Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab902c0b-7048-4555-9eda-6ebc1c4c017a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:46.844575+00:00, try_number=1, job_id=441, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-04 00:00:00+00:00 +INFO - Started process 3501 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-04T00:00:00+00:00', '--job-id', '441', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuwwqloep'] +INFO - Job 441: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249952550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004247Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004247Z +20221111/us-east-1/s3/aws4_request +296e28b9210d03fe0588036e76c341b0a14403f13721310e03506d42532a911a +INFO - '2022-11-11' - botocore.auth - Signature: +f83b6190f7d1ae77e9cbc64b0baec9a22b7d1ba7f09c5dc8f15976bd81b22d06 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UZjpn24rXZKzZ9hdYuVeEHpmsejIT5noXxfNjBMAS5O3NbJYY3mdxWE0P0l8Yl6XPz4PsOzG7Uw=', 'x-amz-request-id': 'FDYD3DG58WRQK7TM', 'Date': 'Fri, 11 Nov 2022 00:42:48 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180504T000000, start_date=20221111T004246, end_date=20221111T004249 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:49.151373Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab902c0b-7048-4555-9eda-6ebc1c4c017a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e2774085 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:42.216877Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fc139782-d9b3-4314-8a83-c76d7fc40b3f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:42.216877+00:00, try_number=1, job_id=440, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-04 00:00:00+00:00 +INFO - Started process 3495 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-04T00:00:00+00:00', '--job-id', '440', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph9jy1pou'] +INFO - Job 440: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180504T000000, start_date=20221111T004242, end_date=20221111T004247 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:47.010282Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fc139782-d9b3-4314-8a83-c76d7fc40b3f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..4988e789 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:42.200736Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e23be9a7-533a-3cfd-b8f5-99652e7b82fb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e558b385-35b1-4c0a-8768-0f0e742cd7fa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:42.200736+00:00, try_number=1, job_id=439, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-04 00:00:00+00:00 +INFO - Started process 3494 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-04T00:00:00+00:00', '--job-id', '439', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9_zz9fgu'] +INFO - Job 439: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180504T000000, start_date=20221111T004242, end_date=20221111T004245 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:45.384123Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e558b385-35b1-4c0a-8768-0f0e742cd7fa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c31c13d7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:53.176565Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d9c48ab-522b-46e6-84be-c5a398d7f49c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:53.176565+00:00, try_number=1, job_id=444, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-05 00:00:00+00:00 +INFO - Started process 3519 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-05T00:00:00+00:00', '--job-id', '444', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoil2lx45'] +INFO - Job 444: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180505T000000, start_date=20221111T004253, end_date=20221111T004256 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:56.146742Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d9c48ab-522b-46e6-84be-c5a398d7f49c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2b545b52 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:42:53.168048Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "96ef8c0b-b1c6-4bbc-a0f5-5f9f5ba2f8da"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:53.168048+00:00, try_number=1, job_id=443, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-05 00:00:00+00:00 +INFO - Started process 3518 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-05T00:00:00+00:00', '--job-id', '443', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkg5pphdo'] +INFO - Job 443: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180505T000000, start_date=20221111T004253, end_date=20221111T004256 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:42:56.152771Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "96ef8c0b-b1c6-4bbc-a0f5-5f9f5ba2f8da"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4066962a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:04.965383Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f993af17-1de8-4fc4-82b5-d5a4604153eb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:04.965383+00:00, try_number=1, job_id=448, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-05 00:00:00+00:00 +INFO - Started process 3579 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-05T00:00:00+00:00', '--job-id', '448', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpspzeld6i'] +INFO - Job 448: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'zY3qSkQ9+O8KZUQQR7s9Eg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:zY3qSkQ9+O8KZUQQR7s9Eg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004305Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004305Z +20221111/us-east-1/s3/aws4_request +435078c8d3daf4f4e190d7654f39091456bd25b8b51703b9133d5f8148008e92 +INFO - '2022-11-11' - botocore.auth - Signature: +ee229ae16654704f75da8bec0ac12cbda8f617aaaa12df6d23979208aabf6b3b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BD+s6dzG+YyQoHMmWa2LMSN9tQOxSnQj0iQQ0fHW2c4nrj2rNQwUZDTpzoydL9s+z2qrH/i23dM=', 'x-amz-request-id': 'FSAG4EM9N7CH6HNZ', 'Date': 'Fri, 11 Nov 2022 00:43:06 GMT', 'ETag': '"cd8dea4a443df8ef0a65441047bb3d12"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180505T000000, start_date=20221111T004304, end_date=20221111T004306 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:06.828089Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f993af17-1de8-4fc4-82b5-d5a4604153eb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..273be18b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:02.724842Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0899800e-156c-418b-a3dc-3dfb6f17b90a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:02.724842+00:00, try_number=1, job_id=447, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-05 00:00:00+00:00 +INFO - Started process 3571 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-05T00:00:00+00:00', '--job-id', '447', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqbdc548b'] +INFO - Job 447: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50061f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004303Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004303Z +20221111/us-east-1/s3/aws4_request +8156cedb3e05db5646cc2fca5c2b8d52a003c35e674325501d8bed4d00120853 +INFO - '2022-11-11' - botocore.auth - Signature: +df0de6e92d2e8f59dd2c565b86e84dd24c0af983ecf4f01d5c563d16781f245a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '25CQazVTfhOOp7XALj6S4+EQPYzlpBN3ZJeUlSeuRHc2LFO5fPvAwirjY1TrkXRAgoVTQ0gWarA=', 'x-amz-request-id': 'WFF1SRN64DXD7WXV', 'Date': 'Fri, 11 Nov 2022 00:43:04 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180505T000000, start_date=20221111T004302, end_date=20221111T004304 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:04.839577Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0899800e-156c-418b-a3dc-3dfb6f17b90a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..10492175 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:58.111892Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85af96ff-ffbf-4b80-a55f-318333c1f4d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:58.111892+00:00, try_number=1, job_id=445, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-05 00:00:00+00:00 +INFO - Started process 3564 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-05T00:00:00+00:00', '--job-id', '445', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpghqrx4kc'] +INFO - Job 445: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180505T000000, start_date=20221111T004258, end_date=20221111T004303 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:03.455469Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85af96ff-ffbf-4b80-a55f-318333c1f4d6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a65efd87 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:42:58.124557Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a3096797-0053-37da-a08f-f3ee7517e703"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "87d71f43-4e1b-43da-af2c-ef1116b1471f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:42:58.124557+00:00, try_number=1, job_id=446, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-05 00:00:00+00:00 +INFO - Started process 3566 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-05T00:00:00+00:00', '--job-id', '446', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4vv4scej'] +INFO - Job 446: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180505T000000, start_date=20221111T004258, end_date=20221111T004300 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:00.974219Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "87d71f43-4e1b-43da-af2c-ef1116b1471f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f10663c0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:09.963036Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0a54acd7-7007-4564-8942-c0d32ee41862"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:09.963036+00:00, try_number=1, job_id=450, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-06 00:00:00+00:00 +INFO - Started process 3545 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-06T00:00:00+00:00', '--job-id', '450', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphb7o_pm6'] +INFO - Job 450: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180506T000000, start_date=20221111T004309, end_date=20221111T004313 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:13.261843Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0a54acd7-7007-4564-8942-c0d32ee41862"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d61856d9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:09.969723Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "973192af-f0f3-43f4-90bf-86fe3f037c26"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:09.969723+00:00, try_number=1, job_id=449, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-06 00:00:00+00:00 +INFO - Started process 3554 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-06T00:00:00+00:00', '--job-id', '449', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfdbis4j9'] +INFO - Job 449: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180506T000000, start_date=20221111T004309, end_date=20221111T004313 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:13.263618Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "973192af-f0f3-43f4-90bf-86fe3f037c26"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f697e47d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:21.063554Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49695f05-cc8d-44ac-b18b-55ec13f2a15e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:21.063554+00:00, try_number=1, job_id=454, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-06 00:00:00+00:00 +INFO - Started process 3596 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-06T00:00:00+00:00', '--job-id', '454', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvn_iwy13'] +INFO - Job 454: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'hNyfSO0UmS+WxStNtu9U9g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:hNyfSO0UmS+WxStNtu9U9g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004322Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004322Z +20221111/us-east-1/s3/aws4_request +8d8be3ca230d38fcb11491a74ca80db38a362d68007d806c50b387c73329ebd0 +INFO - '2022-11-11' - botocore.auth - Signature: +aa7f2caae44b781708d9c9d4eef533a659c143349efb2286e1e68cd42406ee26 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '/E3i/9eL0Kk3FPIb11ygAvdMQr7M4aYl8CBV/6VG6FnS8ps8EmHtRxPRT6AeUd7Z6rTwbGadxhI=', 'x-amz-request-id': '4FBEKP8GTFYW6QZY', 'Date': 'Fri, 11 Nov 2022 00:43:22 GMT', 'ETag': '"84dc9f48ed14992f96c52b4db6ef54f6"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180506T000000, start_date=20221111T004321, end_date=20221111T004323 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:23.363488Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49695f05-cc8d-44ac-b18b-55ec13f2a15e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..3e59f0a2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:19.460825Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1077e6c1-22ba-43eb-9529-c8d611a00990"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:19.460825+00:00, try_number=1, job_id=453, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-06 00:00:00+00:00 +INFO - Started process 3600 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-06T00:00:00+00:00', '--job-id', '453', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph_28xvwt'] +INFO - Job 453: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004320Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004320Z +20221111/us-east-1/s3/aws4_request +a985e4939e5cf5d99175f0ad85024dfd4ae1abce7b67220690b492a2e5642569 +INFO - '2022-11-11' - botocore.auth - Signature: +e65388dcbc7a520a51b4514a20c0986ba275226543f25344f8c1ccc3dbb7fdd1 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'vIAwm3zOmCt9XhlLoS8663fjvTkZp+S5W4Hm/ksOcKMHfkpeg7cjM9T/ltEcK2jpfsAnG7HyXireejJgsYDOjg==', 'x-amz-request-id': 'KE2N691BECC8AVA2', 'Date': 'Fri, 11 Nov 2022 00:43:20 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180506T000000, start_date=20221111T004319, end_date=20221111T004321 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:21.562057Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1077e6c1-22ba-43eb-9529-c8d611a00990"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..340c0093 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:15.013565Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c183e74-8de7-477d-b990-097ca0213177"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:15.013565+00:00, try_number=1, job_id=451, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-06 00:00:00+00:00 +INFO - Started process 3589 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-06T00:00:00+00:00', '--job-id', '451', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppmojdfnz'] +INFO - Job 451: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180506T000000, start_date=20221111T004315, end_date=20221111T004319 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:19.359580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c183e74-8de7-477d-b990-097ca0213177"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..cdf0b5bc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:15.013565Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "5c384b33-e2d7-34fc-b047-82d1c3f10274"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e31921de-a98f-4027-b136-1dd03c35a27a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:15.013565+00:00, try_number=1, job_id=452, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-06 00:00:00+00:00 +INFO - Started process 3590 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-06T00:00:00+00:00', '--job-id', '452', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphj400971'] +INFO - Job 452: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180506T000000, start_date=20221111T004315, end_date=20221111T004317 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:17.717638Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e31921de-a98f-4027-b136-1dd03c35a27a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..3b5772c7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:25.286276Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2345ffe8-0605-41f3-bab8-f05686157fb5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:25.286276+00:00, try_number=1, job_id=456, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-07 00:00:00+00:00 +INFO - Started process 3663 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-07T00:00:00+00:00', '--job-id', '456', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpb0caww2k'] +INFO - Job 456: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180507T000000, start_date=20221111T004325, end_date=20221111T004328 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:28.593918Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2345ffe8-0605-41f3-bab8-f05686157fb5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..12b91aa2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:25.278830Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "584a4761-db47-48f6-ad0d-6423cd6bc9b7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:25.278830+00:00, try_number=1, job_id=455, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-07 00:00:00+00:00 +INFO - Started process 3656 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-07T00:00:00+00:00', '--job-id', '455', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1ho34bz6'] +INFO - Job 455: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180507T000000, start_date=20221111T004325, end_date=20221111T004328 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:28.677563Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "584a4761-db47-48f6-ad0d-6423cd6bc9b7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..631d519a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:38.918231Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed3406d4-4e05-43a2-a71a-78a5d8acea88"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:38.918231+00:00, try_number=1, job_id=460, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-07 00:00:00+00:00 +INFO - Started process 3688 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-07T00:00:00+00:00', '--job-id', '460', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2r9m5kgr'] +INFO - Job 460: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GCH3ZEDEiGUuGABLU6VzpQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GCH3ZEDEiGUuGABLU6VzpQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004339Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004339Z +20221111/us-east-1/s3/aws4_request +9bb788104a1a5c00c5da1dd86c77fa329a93f011600570eae449b1750ced42d8 +INFO - '2022-11-11' - botocore.auth - Signature: +3a85e60c1112f15bde7a0f9b5905d8cd65af943fb3618a7760b89360a4f69d88 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BZAVkj4LkrKROh9KT6tIbEyXMhf0FhAvluhKNahTS4ofdZVhaSGsWq3jM92iKtYHXOsFbNmJNYE=', 'x-amz-request-id': 'Y5V598C0PAWDA4CZ', 'Date': 'Fri, 11 Nov 2022 00:43:40 GMT', 'ETag': '"1821f76440c488652e18004b53a573a5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180507T000000, start_date=20221111T004338, end_date=20221111T004340 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:40.848856Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed3406d4-4e05-43a2-a71a-78a5d8acea88"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a6cfb377 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:36.911503Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25eb2f1c-1805-4ee0-90d0-f93b111cf7db"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:36.911503+00:00, try_number=1, job_id=459, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-07 00:00:00+00:00 +INFO - Started process 3607 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-07T00:00:00+00:00', '--job-id', '459', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpiv3wwh8x'] +INFO - Job 459: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004337Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004337Z +20221111/us-east-1/s3/aws4_request +c4846d7721752a3f72dfe908f4e36a7a81397595a0bc783135634b5d4ebae727 +INFO - '2022-11-11' - botocore.auth - Signature: +ddbf67091dd63f702cc405ec05b575e4c4cfd87c67cf24b9c51e11ac7576ba2d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NDMfecVsulEhktth1moey7ANmEAGbVjThAxlw4QCmolfdf6gMxqYvGzR+gQlmSOuq++BE7INJ/g=', 'x-amz-request-id': 'J77EAT4Y1QSYS378', 'Date': 'Fri, 11 Nov 2022 00:43:38 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180507T000000, start_date=20221111T004336, end_date=20221111T004338 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:38.719580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25eb2f1c-1805-4ee0-90d0-f93b111cf7db"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..62694b2d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:30.567367Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c7b14847-1011-4bb7-bfe0-3e0f57b3e665"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:30.567367+00:00, try_number=1, job_id=457, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-07 00:00:00+00:00 +INFO - Started process 3680 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-07T00:00:00+00:00', '--job-id', '457', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphhprlkfb'] +INFO - Job 457: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180507T000000, start_date=20221111T004330, end_date=20221111T004337 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:37.496707Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c7b14847-1011-4bb7-bfe0-3e0f57b3e665"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..89907928 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:30.715704Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "95a3b7d7-7991-3081-8c5c-dfdfc5c6065e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d8655fc-8137-4530-a499-244b8d25c629"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:30.715704+00:00, try_number=1, job_id=458, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-07 00:00:00+00:00 +INFO - Started process 3682 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-07T00:00:00+00:00', '--job-id', '458', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcnze63gs'] +INFO - Job 458: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180507T000000, start_date=20221111T004330, end_date=20221111T004333 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:33.989833Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d8655fc-8137-4530-a499-244b8d25c629"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..fdc464c8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:43.134880Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63ec2cc8-0c84-4c37-850b-326911411931"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:43.134880+00:00, try_number=1, job_id=462, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-08 00:00:00+00:00 +INFO - Started process 3678 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-08T00:00:00+00:00', '--job-id', '462', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr7lb_ecl'] +INFO - Job 462: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180508T000000, start_date=20221111T004343, end_date=20221111T004345 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:45.965775Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63ec2cc8-0c84-4c37-850b-326911411931"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..51dbd8c4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:43.092951Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "23f12048-8fe0-465e-82ee-331023c21b8e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:43.092951+00:00, try_number=1, job_id=461, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-08 00:00:00+00:00 +INFO - Started process 3676 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-08T00:00:00+00:00', '--job-id', '461', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpobik27bw'] +INFO - Job 461: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180508T000000, start_date=20221111T004343, end_date=20221111T004345 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:45.957811Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "23f12048-8fe0-465e-82ee-331023c21b8e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..2cf95b8c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:53.826958Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "05ec0f0b-0ecb-453b-bada-fd75b3ed2c13"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:53.826958+00:00, try_number=1, job_id=466, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-08 00:00:00+00:00 +INFO - Started process 3706 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-08T00:00:00+00:00', '--job-id', '466', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp08kx4zf0'] +INFO - Job 466: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GUwDJSE+tmRx3iwaY36IwQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GUwDJSE+tmRx3iwaY36IwQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004355Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004355Z +20221111/us-east-1/s3/aws4_request +c1ec8f9113d1abf04fc0d2479a5229eaf7defa89be997b3fbec8ed6a43d09342 +INFO - '2022-11-11' - botocore.auth - Signature: +7feacb85381410fe6dfe273f71a6444964f14fb19de4ba7e4c36219ddbf51b4a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'OKZEv8y/mFZ7r+kSa9vmfoM1WWyWzFgWBQb7k5rFXNvgDjQRpNVdMD70q/GKz7hDfXH9iD4H2kg=', 'x-amz-request-id': '289F3QKEB6STDM43', 'Date': 'Fri, 11 Nov 2022 00:43:56 GMT', 'ETag': '"194c0325213eb66471de2c1a637e88c1"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180508T000000, start_date=20221111T004353, end_date=20221111T004357 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:57.087994Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "05ec0f0b-0ecb-453b-bada-fd75b3ed2c13"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..14203ccf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:51.680871Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "322eecba-920c-4327-aa64-b4d8ec0aefde"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:51.680871+00:00, try_number=1, job_id=465, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-08 00:00:00+00:00 +INFO - Started process 3698 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-08T00:00:00+00:00', '--job-id', '465', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfiiehw__'] +INFO - Job 465: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004352Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004352Z +20221111/us-east-1/s3/aws4_request +a59b2a1dd12213dc1df422a80052b239e55bddfdea477a200229dfdb09dd2313 +INFO - '2022-11-11' - botocore.auth - Signature: +d507f8823fd59eeef872c7ef17bba1101999aa986df5ce757fcd53c1184d1737 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BM/v3kMFPhDHo8HRW1Vv3c3xpRXsUYqLCgxj943R1RjpTuDlfLfJ5U+37PA9zbNGcnIyLithUU8=', 'x-amz-request-id': 'PWNDGB0JFFD17TAG', 'Date': 'Fri, 11 Nov 2022 00:43:52 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180508T000000, start_date=20221111T004351, end_date=20221111T004353 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:53.575923Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "322eecba-920c-4327-aa64-b4d8ec0aefde"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..60ec1da0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:47.465548Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "90b52b14-3ba8-4ceb-b4fd-dfb08347d72c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:47.465548+00:00, try_number=1, job_id=463, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-08 00:00:00+00:00 +INFO - Started process 3692 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-08T00:00:00+00:00', '--job-id', '463', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp734_sado'] +INFO - Job 463: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180508T000000, start_date=20221111T004347, end_date=20221111T004352 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:52.290888Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "90b52b14-3ba8-4ceb-b4fd-dfb08347d72c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..547263eb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:43:47.465506Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8cbde5cc-f2df-33e1-a640-f7a74122ec3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "775fd529-9f45-4f3f-8d68-a9f0310d4428"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:47.465506+00:00, try_number=1, job_id=464, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-08 00:00:00+00:00 +INFO - Started process 3693 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-08T00:00:00+00:00', '--job-id', '464', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi2ynt9js'] +INFO - Job 464: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180508T000000, start_date=20221111T004347, end_date=20221111T004349 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:43:49.901755Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "775fd529-9f45-4f3f-8d68-a9f0310d4428"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..70ac5669 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:59.462918Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d2b901bb-7cff-4535-8e51-5675ddad1751"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:59.462918+00:00, try_number=1, job_id=467, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-09 00:00:00+00:00 +INFO - Started process 3715 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-09T00:00:00+00:00', '--job-id', '467', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz9p9fsue'] +INFO - Job 467: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180509T000000, start_date=20221111T004359, end_date=20221111T004402 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:02.366345Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d2b901bb-7cff-4535-8e51-5675ddad1751"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..8b321cd0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:43:59.493216Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "609ff8f1-a3eb-45c8-a43a-00b104b56dd8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:43:59.493216+00:00, try_number=1, job_id=468, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-09 00:00:00+00:00 +INFO - Started process 3717 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-09T00:00:00+00:00', '--job-id', '468', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkc8jkkir'] +INFO - Job 468: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180509T000000, start_date=20221111T004359, end_date=20221111T004403 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:03.412804Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "609ff8f1-a3eb-45c8-a43a-00b104b56dd8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..75c39564 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:13.471523Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c0280833-4c9c-4426-9d60-e53bdeda394d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:13.471523+00:00, try_number=1, job_id=472, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-09 00:00:00+00:00 +INFO - Started process 3786 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-09T00:00:00+00:00', '--job-id', '472', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_tjpb6_u'] +INFO - Job 472: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'sl6/Hcb75nnZHpTgzSNckg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:sl6/Hcb75nnZHpTgzSNckg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004414Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004414Z +20221111/us-east-1/s3/aws4_request +2dbdcd6f97db27161e5476cef746d48438b1f210690fde6d790d8b4c8ac03657 +INFO - '2022-11-11' - botocore.auth - Signature: +5cb6fbd6e3b271af94ba4e145c19913fc1dd238775cd6bebc417cba9b3beabe1 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'wrkZ+SFM2mPz33yVwFpik3Q3WKuoBeIXSgLhLEZYhmyYu37wck0nnc5ra/UnKl0rX+RqTDv/Vvs=', 'x-amz-request-id': 'J1759SNJE34TWNXB', 'Date': 'Fri, 11 Nov 2022 00:44:14 GMT', 'ETag': '"b25ebf1dc6fbe679d91e94e0cd235c92"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180509T000000, start_date=20221111T004413, end_date=20221111T004415 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:15.406902Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c0280833-4c9c-4426-9d60-e53bdeda394d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..45f2a4e6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:10.862054Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "00f5ae81-da42-4e71-8445-b13031ad64ed"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:10.862054+00:00, try_number=1, job_id=471, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-09 00:00:00+00:00 +INFO - Started process 3765 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-09T00:00:00+00:00', '--job-id', '471', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqm2y5eu6'] +INFO - Job 471: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50061f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004412Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004412Z +20221111/us-east-1/s3/aws4_request +4c08f5f701fae7ad4d9fef698a2bd3364c7bb95866e1dd9af5ce9a170bc69843 +INFO - '2022-11-11' - botocore.auth - Signature: +e566977b48d7be31ec55ad2bc44e7eef4fa0718409262252c3bc068a59b2dca6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NjJ5eX1a7walavzCbj/JJHPEZPtJqIwps7k6t0TlEL84yNptGocdrJTPl4UTaYd265Svult5XxE=', 'x-amz-request-id': 'CZSM48NJ8VGVGY8A', 'Date': 'Fri, 11 Nov 2022 00:44:13 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180509T000000, start_date=20221111T004410, end_date=20221111T004413 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:13.632400Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "00f5ae81-da42-4e71-8445-b13031ad64ed"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..3b84a6c3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:04.442018Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "37ff8b06-752a-42ac-be2b-68ee1bfef72d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:04.442018+00:00, try_number=1, job_id=469, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-09 00:00:00+00:00 +INFO - Started process 3723 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-09T00:00:00+00:00', '--job-id', '469', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi2rvi2jo'] +INFO - Job 469: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180509T000000, start_date=20221111T004404, end_date=20221111T004410 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:10.973726Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "37ff8b06-752a-42ac-be2b-68ee1bfef72d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..b6763f6e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:05.735549Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "28b9f2ff-32b0-30a1-af6c-935906d7f598"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "636895a3-7b56-4f4b-a68f-832a1ec22de1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:05.735549+00:00, try_number=1, job_id=470, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-09 00:00:00+00:00 +INFO - Started process 3760 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-09T00:00:00+00:00', '--job-id', '470', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplzg_33m0'] +INFO - Job 470: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180509T000000, start_date=20221111T004405, end_date=20221111T004408 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:08.798757Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "636895a3-7b56-4f4b-a68f-832a1ec22de1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..1d46af98 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:44:18.165375Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f22cab4d-e7f2-407f-b061-9c08debeacc9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:18.165375+00:00, try_number=1, job_id=473, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-10 00:00:00+00:00 +INFO - Started process 3802 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-10T00:00:00+00:00', '--job-id', '473', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsv8rhibd'] +INFO - Job 473: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180510T000000, start_date=20221111T004418, end_date=20221111T004420 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:20.885895Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f22cab4d-e7f2-407f-b061-9c08debeacc9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..cea61195 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:44:18.182107Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7d0f55bf-b752-4418-9d35-9c1108fb6ff7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:18.182107+00:00, try_number=1, job_id=474, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-10 00:00:00+00:00 +INFO - Started process 3804 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-10T00:00:00+00:00', '--job-id', '474', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvypcj0oc'] +INFO - Job 474: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180510T000000, start_date=20221111T004418, end_date=20221111T004421 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:21.453371Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7d0f55bf-b752-4418-9d35-9c1108fb6ff7"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..fdc4f778 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:32.111364Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d317776f-1b50-4f7d-be6d-95e43ea023e7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:32.111364+00:00, try_number=1, job_id=478, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-10 00:00:00+00:00 +INFO - Started process 3842 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-10T00:00:00+00:00', '--job-id', '478', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpso2_1j38'] +INFO - Job 478: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GCH3ZEDEiGUuGABLU6VzpQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GCH3ZEDEiGUuGABLU6VzpQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004432Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004432Z +20221111/us-east-1/s3/aws4_request +70a1056f649d26ccd2c56c0fe80f329ac867623c35d549c4621ebc6583942174 +INFO - '2022-11-11' - botocore.auth - Signature: +6338a167b13315afce8448f23d93b6d9c631f1bda26387b8df16849b1ebcbd68 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+tLwsuVAYnqYgSYqzhDLumdUFukys8sG2/cpEm23wM9LSlPC+umspJGAMPhI7BhV5lZ4ZmhgHDU=', 'x-amz-request-id': 'Z1MARYSRT12NAEQ0', 'Date': 'Fri, 11 Nov 2022 00:44:33 GMT', 'ETag': '"1821f76440c488652e18004b53a573a5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180510T000000, start_date=20221111T004432, end_date=20221111T004433 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:33.905126Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d317776f-1b50-4f7d-be6d-95e43ea023e7"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..0227c45c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:28.563899Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1e03d04e-a478-49af-be9e-f4e637d29041"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:28.563899+00:00, try_number=1, job_id=477, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-10 00:00:00+00:00 +INFO - Started process 3814 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-10T00:00:00+00:00', '--job-id', '477', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4pnz3q8v'] +INFO - Job 477: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004429Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004429Z +20221111/us-east-1/s3/aws4_request +240ea0f6f0aa709c38b6c8cfb54f4ad74199df1dd6286efa14d2ecebc9c4ae94 +INFO - '2022-11-11' - botocore.auth - Signature: +d54cc7e200c91db45d18a3b17549a8eb5cd5993f3519727aaf4ba3132dcc2fe5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'wbAKbKBZk7kr3x656R3S7XDb2rCufJxgdfpX73ZRc+YY1seqxAYdoTumtoB5tklRWi0K95jvmf0=', 'x-amz-request-id': '2R2VTK8PCN0A67K5', 'Date': 'Fri, 11 Nov 2022 00:44:30 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180510T000000, start_date=20221111T004428, end_date=20221111T004431 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:31.581074Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1e03d04e-a478-49af-be9e-f4e637d29041"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b6597783 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:23.208566Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39110e80-e153-41ec-b25e-0883424eefec"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:23.208566+00:00, try_number=1, job_id=475, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-10 00:00:00+00:00 +INFO - Started process 3810 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-10T00:00:00+00:00', '--job-id', '475', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3wjm9zaj'] +INFO - Job 475: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180510T000000, start_date=20221111T004423, end_date=20221111T004430 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:30.635256Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39110e80-e153-41ec-b25e-0883424eefec"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..128b2d4f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:23.248349Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "61176de4-0327-3bcf-81b5-2d25d67d47ee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae625692-9784-4955-8ca5-b7577f46486b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:23.248349+00:00, try_number=1, job_id=476, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-10 00:00:00+00:00 +INFO - Started process 3772 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-10T00:00:00+00:00', '--job-id', '476', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0upigega'] +INFO - Job 476: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180510T000000, start_date=20221111T004423, end_date=20221111T004426 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:26.396319Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae625692-9784-4955-8ca5-b7577f46486b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d4638958 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:44:35.926431Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e9e00eeb-53a5-4f15-af08-50ba79b3c3f1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:35.926431+00:00, try_number=1, job_id=479, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-11 00:00:00+00:00 +INFO - Started process 3823 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-11T00:00:00+00:00', '--job-id', '479', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1lxtfncz'] +INFO - Job 479: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180511T000000, start_date=20221111T004435, end_date=20221111T004438 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:38.831357Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e9e00eeb-53a5-4f15-af08-50ba79b3c3f1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..288e681f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:44:35.932653Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b0dbf03-ac64-413f-95e5-60939b259a4e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:35.932653+00:00, try_number=1, job_id=480, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-11 00:00:00+00:00 +INFO - Started process 3826 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-11T00:00:00+00:00', '--job-id', '480', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3twf7ec_'] +INFO - Job 480: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180511T000000, start_date=20221111T004435, end_date=20221111T004438 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:38.833728Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b0dbf03-ac64-413f-95e5-60939b259a4e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..84fb651a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:50.155862Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db5c1e91-b033-4d70-8a73-5794296b6429"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:50.155862+00:00, try_number=1, job_id=484, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-11 00:00:00+00:00 +INFO - Started process 3866 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-11T00:00:00+00:00', '--job-id', '484', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz5xfh94k'] +INFO - Job 484: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'KpDoctriTj0Nb9LNw/KJGg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:KpDoctriTj0Nb9LNw/KJGg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004451Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004451Z +20221111/us-east-1/s3/aws4_request +866aa579421ff6830ca26872f94b06b54e2be3861a2cb1526793bf2a5b6be0db +INFO - '2022-11-11' - botocore.auth - Signature: +01876dec2472dc810cf8910821390c7e74b85eae0d114a9f9bbb91620622d1dc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'G9U8TgRsajmY9GxIN3loGtNTWkjDTHDxZiSJ4uPMiQuVDGzmnWpDgDXJxm0YkENi8VnjUoVYq9g=', 'x-amz-request-id': 'NSQ4PCGCFCPC1JGP', 'Date': 'Fri, 11 Nov 2022 00:44:51 GMT', 'ETag': '"2a90e872dae24e3d0d6fd2cdc3f2891a"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180511T000000, start_date=20221111T004450, end_date=20221111T004452 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:52.145660Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db5c1e91-b033-4d70-8a73-5794296b6429"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5efa76e5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:46.309630Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9a38e2d-fadb-49ac-aae7-578bf062755f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:46.309630+00:00, try_number=1, job_id=483, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-11 00:00:00+00:00 +INFO - Started process 3858 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-11T00:00:00+00:00', '--job-id', '483', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqco0f2t3'] +INFO - Job 483: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50073a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004447Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004447Z +20221111/us-east-1/s3/aws4_request +782646b2360f49789a4a2f290c0fe50ed283e6ecd4fad0204ea5f94adb07fec0 +INFO - '2022-11-11' - botocore.auth - Signature: +eeb986487bb237c50c46c7f6be1639a90e8fe69a0077f7c024dbe30a61c98ccf +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'n9e/TYTB+dYB6gYhF0pRRPfmG9odkafsqw40kFTaWgK+WL0/ACNtomAKSo4/a4qa9+gp6X7AsCE=', 'x-amz-request-id': '72PMSY4H5T2XBJZG', 'Date': 'Fri, 11 Nov 2022 00:44:47 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180511T000000, start_date=20221111T004446, end_date=20221111T004448 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:48.409078Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9a38e2d-fadb-49ac-aae7-578bf062755f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b778e1cd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:40.672365Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d267657-2778-491b-b5bd-ae5c6ff2c45d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:40.672365+00:00, try_number=1, job_id=481, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-11 00:00:00+00:00 +INFO - Started process 3852 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-11T00:00:00+00:00', '--job-id', '481', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnuwifneu'] +INFO - Job 481: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180511T000000, start_date=20221111T004440, end_date=20221111T004448 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:48.578975Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2d267657-2778-491b-b5bd-ae5c6ff2c45d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..653029a9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:44:40.763628Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8b3a412d-f495-32e2-aaa7-5fda9e34b64a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "19ab8f85-aadb-40ec-a43e-8c9f2eca5f58"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:40.763628+00:00, try_number=1, job_id=482, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-11 00:00:00+00:00 +INFO - Started process 3853 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-11T00:00:00+00:00', '--job-id', '482', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv57pu_fq'] +INFO - Job 482: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180511T000000, start_date=20221111T004440, end_date=20221111T004443 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:43.910111Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "19ab8f85-aadb-40ec-a43e-8c9f2eca5f58"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..5d8e23bd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:44:54.678888Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25fecd7a-f811-4cbb-b18d-b3691382f389"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:54.678888+00:00, try_number=1, job_id=486, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-12 00:00:00+00:00 +INFO - Started process 3876 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-12T00:00:00+00:00', '--job-id', '486', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyd3xyvwx'] +INFO - Job 486: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180512T000000, start_date=20221111T004454, end_date=20221111T004458 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:58.585555Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25fecd7a-f811-4cbb-b18d-b3691382f389"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7d3634d0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:44:54.646005Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf436dab-9a56-4e30-adb2-bcc842a402b7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:44:54.646005+00:00, try_number=1, job_id=485, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-12 00:00:00+00:00 +INFO - Started process 3877 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-12T00:00:00+00:00', '--job-id', '485', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0d0u1_l8'] +INFO - Job 485: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180512T000000, start_date=20221111T004454, end_date=20221111T004458 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:44:58.584529Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf436dab-9a56-4e30-adb2-bcc842a402b7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bab6f800 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:12.908812Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d177a25b-043d-4229-bf5d-47d981029d90"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:12.908812+00:00, try_number=1, job_id=490, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-12 00:00:00+00:00 +INFO - Started process 3883 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-12T00:00:00+00:00', '--job-id', '490', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwhm1n8fv'] +INFO - Job 490: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'KpDoctriTj0Nb9LNw/KJGg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:KpDoctriTj0Nb9LNw/KJGg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004514Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004514Z +20221111/us-east-1/s3/aws4_request +694104c9b5cc3f7434649aaa6cfa562d1dc1a2ba991652cf996405c79a52294a +INFO - '2022-11-11' - botocore.auth - Signature: +f78e386bcec83a26700077f11b7a7a204fdcf627af459ce3eef305c8ec52be15 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'nAsASPWJHnFWbMPU91hLQ2HX8mk7p/PsiVNtfDOJ2UHap6GH7s5NBDs0uly3Dxan5E/hSjDuizs=', 'x-amz-request-id': 'PHB2TWAG4MHB277S', 'Date': 'Fri, 11 Nov 2022 00:45:15 GMT', 'ETag': '"2a90e872dae24e3d0d6fd2cdc3f2891a"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180512T000000, start_date=20221111T004512, end_date=20221111T004515 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:15.859637Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d177a25b-043d-4229-bf5d-47d981029d90"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c90612a6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:07.424545Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aae1bd9d-38a5-4c95-ad73-29e103b7fe33"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:07.424545+00:00, try_number=1, job_id=489, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-12 00:00:00+00:00 +INFO - Started process 3906 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-12T00:00:00+00:00', '--job-id', '489', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoe0qe2k7'] +INFO - Job 489: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004508Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004508Z +20221111/us-east-1/s3/aws4_request +b3ccbbc0861f7d5c4bd5f9a676d60f96a9041449f493fbaf9474ddc303f6724f +INFO - '2022-11-11' - botocore.auth - Signature: +86a6df3a0f77f71e62677ee63e38950c8b3c653d912545155a03d3e52b594110 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NMjUW9SsZDwnxq+h656aY+ttzxCx6+MImz/h/HMcoy3hqFFidCZoVBwTHCXDLtC1gqJFZiJstS0=', 'x-amz-request-id': 'PAQ0B3V0MDA4TXEG', 'Date': 'Fri, 11 Nov 2022 00:45:09 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180512T000000, start_date=20221111T004507, end_date=20221111T004509 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:09.955502Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aae1bd9d-38a5-4c95-ad73-29e103b7fe33"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b5c8099b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:01.461660Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b39b735d-6323-4256-a519-b51203f72f06"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:01.461660+00:00, try_number=1, job_id=488, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-12 00:00:00+00:00 +INFO - Started process 3901 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-12T00:00:00+00:00', '--job-id', '488', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp05112qj7'] +INFO - Job 488: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180512T000000, start_date=20221111T004501, end_date=20221111T004510 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:10.758539Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b39b735d-6323-4256-a519-b51203f72f06"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..ac06d23c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:01.503470Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bc9c1498-8ef6-3ba6-9f3e-7f0a54d078bf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "95589de3-391a-4465-9a14-5e4924a60351"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:01.503470+00:00, try_number=1, job_id=487, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-12 00:00:00+00:00 +INFO - Started process 3900 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-12T00:00:00+00:00', '--job-id', '487', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphwobynqq'] +INFO - Job 487: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180512T000000, start_date=20221111T004501, end_date=20221111T004504 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:04.845582Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "95589de3-391a-4465-9a14-5e4924a60351"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..47ad6c91 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:45:19.415359Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fa2acbbf-3c3b-4b24-815e-5961f851db58"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:19.415359+00:00, try_number=1, job_id=491, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-13 00:00:00+00:00 +INFO - Started process 3891 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-13T00:00:00+00:00', '--job-id', '491', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppyd8vptk'] +INFO - Job 491: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180513T000000, start_date=20221111T004519, end_date=20221111T004522 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:22.918423Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fa2acbbf-3c3b-4b24-815e-5961f851db58"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..52ad9d39 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:45:20.310441Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c37dfedc-0dae-4fe2-88fe-2619c5f0f2ca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:20.310441+00:00, try_number=1, job_id=492, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-13 00:00:00+00:00 +INFO - Started process 3894 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-13T00:00:00+00:00', '--job-id', '492', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp40_o0dok'] +INFO - Job 492: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180513T000000, start_date=20221111T004520, end_date=20221111T004524 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:24.280497Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c37dfedc-0dae-4fe2-88fe-2619c5f0f2ca"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..db4bb703 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:41.174428Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "731faddc-45af-4843-b4f7-6f9bc1d34cea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:41.174428+00:00, try_number=1, job_id=496, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-13 00:00:00+00:00 +INFO - Started process 3919 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-13T00:00:00+00:00', '--job-id', '496', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzqlveutv'] +INFO - Job 496: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'hQecBovzqdPrINAiQ8N3dA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:hQecBovzqdPrINAiQ8N3dA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004542Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004542Z +20221111/us-east-1/s3/aws4_request +60ac7c1167158ef320aec1ea4e16f0fb25e6b84627bd28a2f65ff74b9d3f44e6 +INFO - '2022-11-11' - botocore.auth - Signature: +014cbfce887506d935db19eb7955b499aca0d0ccd2f9c2b3ecb419567bb04e1b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'bTm0b68s9ut1omkfaaFJLVywl+Q7q2vTKs2baZhbXELNjvB767Kpt8rLj28iqcCRuefYqDdqais=', 'x-amz-request-id': '8HP4V8Z51W0AT97J', 'Date': 'Fri, 11 Nov 2022 00:45:42 GMT', 'ETag': '"85079c068bf3a9d3eb20d02243c37774"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180513T000000, start_date=20221111T004541, end_date=20221111T004543 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:43.436719Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "731faddc-45af-4843-b4f7-6f9bc1d34cea"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..8edbd16c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:36.805782Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e3c0a8f-f445-441c-aebf-f063f60d4ef8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:36.805782+00:00, try_number=1, job_id=495, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-13 00:00:00+00:00 +INFO - Started process 3969 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-13T00:00:00+00:00', '--job-id', '495', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe_6y58nk'] +INFO - Job 495: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50063a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004538Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004538Z +20221111/us-east-1/s3/aws4_request +c2c2c34162a32d0c2f45ba9677fada9ed61bb97e544dfa4c2ea1a5922feb39ab +INFO - '2022-11-11' - botocore.auth - Signature: +14b0417b75c8bf6ec7e0b7fb4ebb85502e128c553ddb2c54a2c11fffdc33e6ad +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NlOnbOwa+/TUqLZZ/TktQL8s7nhYKhAvYeykwcYAUaXToGsynVO33OeB6LuQtbfKzKBkM8MQSTg=', 'x-amz-request-id': '2VNR635NDTN6BYV6', 'Date': 'Fri, 11 Nov 2022 00:45:38 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180513T000000, start_date=20221111T004536, end_date=20221111T004539 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:39.602581Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e3c0a8f-f445-441c-aebf-f063f60d4ef8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..07b9cb22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:26.818838Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "afe7aced-7855-4c32-8c7a-949d1da815cb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:26.818838+00:00, try_number=1, job_id=493, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-13 00:00:00+00:00 +INFO - Started process 3911 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-13T00:00:00+00:00', '--job-id', '493', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfch7wn_1'] +INFO - Job 493: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180513T000000, start_date=20221111T004526, end_date=20221111T004538 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:38.397702Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "afe7aced-7855-4c32-8c7a-949d1da815cb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..bcc6556c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:29.304092Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0afd9ba4-b3b1-3ebb-bb76-9f571bae6a23"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7548036d-e2cb-43cc-a57a-5f174d06599e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:29.304092+00:00, try_number=1, job_id=494, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-13 00:00:00+00:00 +INFO - Started process 3914 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-13T00:00:00+00:00', '--job-id', '494', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpog_aj9_1'] +INFO - Job 494: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180513T000000, start_date=20221111T004529, end_date=20221111T004533 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:33.687428Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7548036d-e2cb-43cc-a57a-5f174d06599e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0bf3453d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:45:46.447597Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d8519f76-69fc-4e87-a341-7a587c2081b0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:46.447597+00:00, try_number=1, job_id=498, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-14 00:00:00+00:00 +INFO - Started process 3979 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-14T00:00:00+00:00', '--job-id', '498', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw02idt40'] +INFO - Job 498: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180514T000000, start_date=20221111T004546, end_date=20221111T004549 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:49.363729Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d8519f76-69fc-4e87-a341-7a587c2081b0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..1ac35887 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:45:46.447692Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1731da22-fbd7-4239-ab94-723355b11328"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:46.447692+00:00, try_number=1, job_id=497, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-14 00:00:00+00:00 +INFO - Started process 3981 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-14T00:00:00+00:00', '--job-id', '497', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsohsi0gu'] +INFO - Job 497: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180514T000000, start_date=20221111T004546, end_date=20221111T004549 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:49.248539Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1731da22-fbd7-4239-ab94-723355b11328"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..cfb288c4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:57.850904Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a2e29dc-5d6f-4940-b1fb-5a36b498714a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:57.850904+00:00, try_number=1, job_id=502, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-14 00:00:00+00:00 +INFO - Started process 3991 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-14T00:00:00+00:00', '--job-id', '502', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzc48pars'] +INFO - Job 502: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'hQecBovzqdPrINAiQ8N3dA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:hQecBovzqdPrINAiQ8N3dA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004558Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004558Z +20221111/us-east-1/s3/aws4_request +3900498ab6c3773ee3d11811f902167ce5bb85ff44e7115da877935e0939c6fc +INFO - '2022-11-11' - botocore.auth - Signature: +eff654c22f268e4ffebe5b56b5f04031650b7903e8b72b4ef557460b6223c34e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '72sAAX9KDEdqPqFS7DQLsF+jH7Mqj6oyEB2D3keiSjYDqWQ52X/Ws5DJqbKYVzVNv7TpO8m+1xk=', 'x-amz-request-id': '9JHP1ND02Y84XVBK', 'Date': 'Fri, 11 Nov 2022 00:45:59 GMT', 'ETag': '"85079c068bf3a9d3eb20d02243c37774"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180514T000000, start_date=20221111T004557, end_date=20221111T004559 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:59.793665Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a2e29dc-5d6f-4940-b1fb-5a36b498714a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1c3b8a7c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:55.208778Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c5b9adfa-4489-4c73-be2f-d471f22cf138"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:55.208778+00:00, try_number=1, job_id=501, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-14 00:00:00+00:00 +INFO - Started process 3996 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-14T00:00:00+00:00', '--job-id', '501', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpeu6kju_4'] +INFO - Job 501: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50073a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004556Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004556Z +20221111/us-east-1/s3/aws4_request +b60130d5dea8d50f4439e9b4ffb5982367f7928c1f89d417389ec5c61aaee5ef +INFO - '2022-11-11' - botocore.auth - Signature: +3d2ea7f3b488c9c275645eb1e4d231dbf9cf0116599faf5eac457051c2dc9a58 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'veJv5g+wgnWoQsUCmcvxF862X0mh+HzRw08BSb1yMyYkADSFH/l5l0hOrsoUGTzdM5fP7bujDDA=', 'x-amz-request-id': 'WDC0NEPZTHC489SK', 'Date': 'Fri, 11 Nov 2022 00:45:56 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180514T000000, start_date=20221111T004555, end_date=20221111T004557 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:57.119206Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c5b9adfa-4489-4c73-be2f-d471f22cf138"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..af31ade7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:50.816568Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "be772d19-2748-4301-b26b-8b53b56e30cb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:50.816568+00:00, try_number=1, job_id=500, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-14 00:00:00+00:00 +INFO - Started process 3990 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-14T00:00:00+00:00', '--job-id', '500', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbw83w7k9'] +INFO - Job 500: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180514T000000, start_date=20221111T004550, end_date=20221111T004556 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:56.265708Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "be772d19-2748-4301-b26b-8b53b56e30cb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..7019b67c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:45:50.817246Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2c36f28d-217f-3e2f-a251-e4fd6455cc8c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "130b4424-01fb-47f1-b256-7f22fb5371c4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:45:50.817246+00:00, try_number=1, job_id=499, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-14 00:00:00+00:00 +INFO - Started process 3991 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-14T00:00:00+00:00', '--job-id', '499', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4vy8nl5p'] +INFO - Job 499: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180514T000000, start_date=20221111T004550, end_date=20221111T004553 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:45:53.446960Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "130b4424-01fb-47f1-b256-7f22fb5371c4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..857e10e1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:46:03.905372Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b846bafd-f4f5-458c-a2f8-676893181883"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:03.905372+00:00, try_number=1, job_id=503, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-15 00:00:00+00:00 +INFO - Started process 4071 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-15T00:00:00+00:00', '--job-id', '503', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp391upxtp'] +INFO - Job 503: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180515T000000, start_date=20221111T004603, end_date=20221111T004607 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:07.287197Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b846bafd-f4f5-458c-a2f8-676893181883"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..53bc9b10 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:46:03.986890Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9188f60-6533-463b-96f2-7e6433f38a42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:03.986890+00:00, try_number=1, job_id=504, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-15 00:00:00+00:00 +INFO - Started process 4073 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-15T00:00:00+00:00', '--job-id', '504', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpovdxl1l8'] +INFO - Job 504: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180515T000000, start_date=20221111T004603, end_date=20221111T004607 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:07.283994Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9188f60-6533-463b-96f2-7e6433f38a42"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..28a025bd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:19.447579Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e293c11-8cd6-4e5c-bb5f-13aaf2c9e2b5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:19.447579+00:00, try_number=1, job_id=508, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-15 00:00:00+00:00 +INFO - Started process 4086 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-15T00:00:00+00:00', '--job-id', '508', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp39vqkz73'] +INFO - Job 508: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MGd0zGcNDGQE2civGobqpw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MGd0zGcNDGQE2civGobqpw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004620Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004620Z +20221111/us-east-1/s3/aws4_request +47bbb436d1618715a74264279c8849a1b4685663ae81508310c0022a0bca8959 +INFO - '2022-11-11' - botocore.auth - Signature: +e2d016a0ef205da6f278eaf4aaec02f252c5ee2ea28e3907c3955566593c7f9e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'LY693qnXu0r2abKlpoO9BH4DicCVdmfCzLATQGj7vFqj+i+WYDv/2h69Q6xsTO6RbQ0mwFcYpXU=', 'x-amz-request-id': '9F5EGBTJ0MWPGSRN', 'Date': 'Fri, 11 Nov 2022 00:46:21 GMT', 'ETag': '"306774cc670d0c6404d9c8af1a86eaa7"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180515T000000, start_date=20221111T004619, end_date=20221111T004621 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:21.774019Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5e293c11-8cd6-4e5c-bb5f-13aaf2c9e2b5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b528615d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:14.223393Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "84f75ef8-37ea-43d8-b4fe-ce57c9e77a8f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:14.223393+00:00, try_number=1, job_id=507, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-15 00:00:00+00:00 +INFO - Started process 4079 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-15T00:00:00+00:00', '--job-id', '507', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw312pael'] +INFO - Job 507: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50061f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004616Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004616Z +20221111/us-east-1/s3/aws4_request +1188d4ab271d03738ca65a6c05bdd2cb4e009f96bf1d8dd1793d11ca53810c94 +INFO - '2022-11-11' - botocore.auth - Signature: +dec41af1657a7fd979fe2c95cb320a37cc9a43b6a6f981072b0dff6cf8a7eee0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '57UfNKTHjNLB+VyNCZCVOA8uJQNYKQrfnphbAT7KUVq5bsqifd7xTA//AA2ALaqTwmax1kLxnqU=', 'x-amz-request-id': '908MRBWFTZP1S3EH', 'Date': 'Fri, 11 Nov 2022 00:46:16 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'x-amzn-internal-status': '200', 'Content-Length': '0', 'Server': 'AmazonS3'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180515T000000, start_date=20221111T004614, end_date=20221111T004617 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:17.798478Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "84f75ef8-37ea-43d8-b4fe-ce57c9e77a8f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..82bef543 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:09.212191Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "caae8e97-9a6d-4f99-b76e-a097564c236f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:09.212191+00:00, try_number=1, job_id=506, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-15 00:00:00+00:00 +INFO - Started process 4002 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-15T00:00:00+00:00', '--job-id', '506', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9gpmb7ru'] +INFO - Job 506: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180515T000000, start_date=20221111T004609, end_date=20221111T004616 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:16.090291Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "caae8e97-9a6d-4f99-b76e-a097564c236f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..58e8ea34 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:09.143401Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "698d45b7-6740-3aa8-8204-d30fc19914dc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "144a26fb-8714-4ce9-9761-10b3faa9f350"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:09.143401+00:00, try_number=1, job_id=505, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-15 00:00:00+00:00 +INFO - Started process 4001 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-15T00:00:00+00:00', '--job-id', '505', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwgegruox'] +INFO - Job 505: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180515T000000, start_date=20221111T004609, end_date=20221111T004612 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:12.046049Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "144a26fb-8714-4ce9-9761-10b3faa9f350"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9e55828a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:46:24.197173Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab1aaebc-1272-4333-8e70-ffcebf5d52cf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:24.197173+00:00, try_number=1, job_id=509, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-16 00:00:00+00:00 +INFO - Started process 4095 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-16T00:00:00+00:00', '--job-id', '509', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplkoze08g'] +INFO - Job 509: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180516T000000, start_date=20221111T004624, end_date=20221111T004627 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:27.347406Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab1aaebc-1272-4333-8e70-ffcebf5d52cf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..27c17b4c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:46:24.205728Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a52c282d-b242-460f-83b9-b1c65f67c696"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:24.205728+00:00, try_number=1, job_id=510, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-16 00:00:00+00:00 +INFO - Started process 4097 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-16T00:00:00+00:00', '--job-id', '510', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg012yv53'] +INFO - Job 510: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180516T000000, start_date=20221111T004624, end_date=20221111T004627 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:27.161991Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a52c282d-b242-460f-83b9-b1c65f67c696"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5fb0cf97 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:38.462758Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "96d6df9d-9882-4ccb-9e9e-1ca73dafcf0f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:38.462758+00:00, try_number=1, job_id=514, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-16 00:00:00+00:00 +INFO - Started process 4175 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-16T00:00:00+00:00', '--job-id', '514', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppu920qjm'] +INFO - Job 514: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MGd0zGcNDGQE2civGobqpw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MGd0zGcNDGQE2civGobqpw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004639Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004639Z +20221111/us-east-1/s3/aws4_request +ec82c8584ae66726f48a6f4cf495e3abecc2ab3c250d7ac1f249599e4754fd2d +INFO - '2022-11-11' - botocore.auth - Signature: +bfee47d2afa6a999cb2e0812aeb927cb160391f2253eff3de3a2659d67b2e334 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+bpruRRGvgTPJg/kVayVATUOnVsg69qeFDfeCW598cnd6oa7expPgymVU9Bhrh1aoMCb3QsuQKU=', 'x-amz-request-id': 'ZJBW792EGKQ3DRTQ', 'Date': 'Fri, 11 Nov 2022 00:46:39 GMT', 'ETag': '"306774cc670d0c6404d9c8af1a86eaa7"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180516T000000, start_date=20221111T004638, end_date=20221111T004640 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:40.258883Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "96d6df9d-9882-4ccb-9e9e-1ca73dafcf0f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..e75ca5ba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:35.224185Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c9f76583-a790-4c71-ac83-3179b4a34cfb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:35.224185+00:00, try_number=1, job_id=513, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-16 00:00:00+00:00 +INFO - Started process 4168 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-16T00:00:00+00:00', '--job-id', '513', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj5nxcllb'] +INFO - Job 513: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50083a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004636Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004636Z +20221111/us-east-1/s3/aws4_request +d14d229d120eb19b29365a7b8e6745c2323d6703bf190e18b67bf2f77de2a824 +INFO - '2022-11-11' - botocore.auth - Signature: +77af735ec85b80c7d2bb7b8f815b1bdadc9929ac9470fd7e3b5c7c2080cd8713 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'uI6vhchFSbkCZzC5ghowq0xNA9r9ZOfCLh07ab3FlXCLd4zfSD4JNWQjv6ADvcDJ6JZGoqWUgkg=', 'x-amz-request-id': '2Y54E8M244XPXVT5', 'Date': 'Fri, 11 Nov 2022 00:46:36 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180516T000000, start_date=20221111T004635, end_date=20221111T004637 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:37.270756Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c9f76583-a790-4c71-ac83-3179b4a34cfb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d8fe17bd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:29.442120Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d843dd44-388e-4221-b55a-7d4afdca8ade"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:29.442120+00:00, try_number=1, job_id=511, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-16 00:00:00+00:00 +INFO - Started process 4076 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-16T00:00:00+00:00', '--job-id', '511', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5pw7t83m'] +INFO - Job 511: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180516T000000, start_date=20221111T004629, end_date=20221111T004637 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:37.069759Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d843dd44-388e-4221-b55a-7d4afdca8ade"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e963a43d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:29.456991Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d10b0080-fc45-3733-a608-8fa547e74aef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9afedd4a-8bd2-4a2c-b4fc-72454990b7b3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:29.456991+00:00, try_number=1, job_id=512, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-16 00:00:00+00:00 +INFO - Started process 4077 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-16T00:00:00+00:00', '--job-id', '512', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphn4klt08'] +INFO - Job 512: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180516T000000, start_date=20221111T004629, end_date=20221111T004632 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:32.760281Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9afedd4a-8bd2-4a2c-b4fc-72454990b7b3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..78a63627 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:46:42.450402Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64d38e2b-019f-401c-a4b6-e904a4d5136f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:42.450402+00:00, try_number=1, job_id=516, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-17 00:00:00+00:00 +INFO - Started process 4186 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-17T00:00:00+00:00', '--job-id', '516', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm29nee1a'] +INFO - Job 516: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180517T000000, start_date=20221111T004642, end_date=20221111T004645 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:45.112179Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64d38e2b-019f-401c-a4b6-e904a4d5136f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..79cdab82 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:46:42.402350Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f07ea32-c60f-4dd5-b1ab-71596c19eb2f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:42.402350+00:00, try_number=1, job_id=515, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-17 00:00:00+00:00 +INFO - Started process 4184 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-17T00:00:00+00:00', '--job-id', '515', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqo7j8cn2'] +INFO - Job 515: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180517T000000, start_date=20221111T004642, end_date=20221111T004645 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:45.115481Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f07ea32-c60f-4dd5-b1ab-71596c19eb2f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5845991c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:56.717406Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46f07162-370c-434c-b4cb-a0caac6f5e7c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:56.717406+00:00, try_number=1, job_id=520, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-17 00:00:00+00:00 +INFO - Started process 4202 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-17T00:00:00+00:00', '--job-id', '520', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpni4lnnqp'] +INFO - Job 520: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'ioj1MM1lVTSi0p6NMEFNXA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:ioj1MM1lVTSi0p6NMEFNXA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004657Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004657Z +20221111/us-east-1/s3/aws4_request +5b2a9a3711d8b67dafe1cd0942fe60d228b0bd6181c39079264c229d72e0cd0a +INFO - '2022-11-11' - botocore.auth - Signature: +7073ff1c5ca76f2cc1af4baafc5a9bad1fa9142288f0ab385715e5f1e28f197d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'zr+8aiBmRnGSVjlXedDDrGkUmZV6n+ywz4mJwx3qSckiSXsuhVEjRCN9TKI8wrvdwoq/BL4755E=', 'x-amz-request-id': '3WFV0NW54GDAEM0F', 'Date': 'Fri, 11 Nov 2022 00:46:58 GMT', 'ETag': '"8a88f530cd655534a2d29e8d30414d5c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180517T000000, start_date=20221111T004656, end_date=20221111T004658 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:58.595244Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46f07162-370c-434c-b4cb-a0caac6f5e7c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..aa5d2da9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:52.776407Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "950211ad-7922-470d-8da0-10891d5af8b4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:52.776407+00:00, try_number=1, job_id=519, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-17 00:00:00+00:00 +INFO - Started process 4148 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-17T00:00:00+00:00', '--job-id', '519', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptt4zfthm'] +INFO - Job 519: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004653Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004653Z +20221111/us-east-1/s3/aws4_request +1550f9a1999f687c56d14e09666863ce940dc63e88f7bd06f93c2fe9585c90c7 +INFO - '2022-11-11' - botocore.auth - Signature: +4056809e7cca44c7f9436d233511d140118513a23887feabeadec3f9416b2d06 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UY6cQnbR+ck+OyOTyt1cx4JXj33CyBu31QcnAL5MEqv5dG/WGb52awTHlL1ZSSWr1GevF9UsbYg=', 'x-amz-request-id': 'CGDAVC13QRSDE88P', 'Date': 'Fri, 11 Nov 2022 00:46:54 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180517T000000, start_date=20221111T004652, end_date=20221111T004655 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:55.153974Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "950211ad-7922-470d-8da0-10891d5af8b4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..32db7f4a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:47.145501Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a3061345-4882-4626-b1e7-b3c497174e1f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:47.145501+00:00, try_number=1, job_id=518, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-17 00:00:00+00:00 +INFO - Started process 4196 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-17T00:00:00+00:00', '--job-id', '518', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2ubzs3cs'] +INFO - Job 518: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180517T000000, start_date=20221111T004647, end_date=20221111T004654 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:54.925226Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a3061345-4882-4626-b1e7-b3c497174e1f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6e7b8afe --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:46:47.143762Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4110842-2af4-3b6b-b44d-b934318242ef"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f5db7e9-d944-41b2-9cdf-d6f86029bb9c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:46:47.143762+00:00, try_number=1, job_id=517, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-17 00:00:00+00:00 +INFO - Started process 4194 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-17T00:00:00+00:00', '--job-id', '517', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp31ph7uho'] +INFO - Job 517: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180517T000000, start_date=20221111T004647, end_date=20221111T004650 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:46:50.362876Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f5db7e9-d944-41b2-9cdf-d6f86029bb9c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..55209a07 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:01.168192Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6cdb04cb-40c0-4b75-a217-e7b84a5a7f33"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:01.168192+00:00, try_number=1, job_id=521, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-18 00:00:00+00:00 +INFO - Started process 4159 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-18T00:00:00+00:00', '--job-id', '521', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd6fhli0m'] +INFO - Job 521: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180518T000000, start_date=20221111T004701, end_date=20221111T004703 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:03.953331Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6cdb04cb-40c0-4b75-a217-e7b84a5a7f33"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c75abd6a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:01.172552Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "264e1eea-7a80-45d1-80e1-934fd992c4ea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:01.172552+00:00, try_number=1, job_id=522, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-18 00:00:00+00:00 +INFO - Started process 4157 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-18T00:00:00+00:00', '--job-id', '522', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoavmlmj2'] +INFO - Job 522: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180518T000000, start_date=20221111T004701, end_date=20221111T004704 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:04.128270Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "264e1eea-7a80-45d1-80e1-934fd992c4ea"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..57536a32 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:13.441879Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce4014e7-5423-4841-bd2c-49d05be353eb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:13.441879+00:00, try_number=1, job_id=526, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-18 00:00:00+00:00 +INFO - Started process 4284 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-18T00:00:00+00:00', '--job-id', '526', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1d8a8y3r'] +INFO - Job 526: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Uib5IMBy4AiP5itLGns+NA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Uib5IMBy4AiP5itLGns+NA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004714Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004714Z +20221111/us-east-1/s3/aws4_request +a6b4cc15b9dc2971da61007b05794368529d866691389c9b2602c8cb9e9c3243 +INFO - '2022-11-11' - botocore.auth - Signature: +820ffdb64b7cdd3e6437af2daf9a19042641e91b5588d6f85e31f79f4e5daace +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'xmM6461YyDkY5stvWdPRyTEv0y6gmQ1HHXIhC/dWoEGIla+R4RGAtycZjD4frnGjTWj1vMHLqFs=', 'x-amz-request-id': '9JFFE7E70793EVNX', 'Date': 'Fri, 11 Nov 2022 00:47:14 GMT', 'ETag': '"5226f920c072e0088fe62b4b1a7b3e34"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180518T000000, start_date=20221111T004713, end_date=20221111T004715 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:15.236585Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce4014e7-5423-4841-bd2c-49d05be353eb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..0f185503 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:11.557119Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "056372b7-e24f-487d-a899-b3aa26921000"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:11.557119+00:00, try_number=1, job_id=525, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-18 00:00:00+00:00 +INFO - Started process 4165 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-18T00:00:00+00:00', '--job-id', '525', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps5w2c1h2'] +INFO - Job 525: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249952550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004712Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004712Z +20221111/us-east-1/s3/aws4_request +6fb0edf6e0460954afa38b70c1026b4ca68213e5072e3fa4803a88097393ff30 +INFO - '2022-11-11' - botocore.auth - Signature: +7fbe780bf94d7b1fe0085feb0c56d7177ec0d71c4d68470ff02bb7a22ffbae49 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'yNX+YllDJDCWwI4847HvnIZYL+X4qg5E8efoMua6rsioFChpRKNu7TxjbDiixaQyrqi2okRsGrM=', 'x-amz-request-id': 'XD9A0MYMCTK7DB3G', 'Date': 'Fri, 11 Nov 2022 00:47:12 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180518T000000, start_date=20221111T004711, end_date=20221111T004713 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:13.271135Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "056372b7-e24f-487d-a899-b3aa26921000"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..884a0071 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:06.519852Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "877b43ed-dc94-41b8-95d8-60ce63c3cbe5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:06.519852+00:00, try_number=1, job_id=523, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-18 00:00:00+00:00 +INFO - Started process 4278 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-18T00:00:00+00:00', '--job-id', '523', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzwbryxjk'] +INFO - Job 523: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180518T000000, start_date=20221111T004706, end_date=20221111T004711 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:11.810052Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "877b43ed-dc94-41b8-95d8-60ce63c3cbe5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3118028e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:06.527389Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e912b01c-37dd-3b68-b0ba-fc94190b1e46"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fe656a86-9f72-45e3-90b1-e1634360510d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:06.527389+00:00, try_number=1, job_id=524, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-18 00:00:00+00:00 +INFO - Started process 4276 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-18T00:00:00+00:00', '--job-id', '524', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuslynhvo'] +INFO - Job 524: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180518T000000, start_date=20221111T004706, end_date=20221111T004709 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:09.388469Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fe656a86-9f72-45e3-90b1-e1634360510d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0783129c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:17.389805Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "89a2cfcf-bacc-4721-bb72-bb83c553e2bf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:17.389805+00:00, try_number=1, job_id=527, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-19 00:00:00+00:00 +INFO - Started process 4293 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-19T00:00:00+00:00', '--job-id', '527', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5cj9z_j3'] +INFO - Job 527: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180519T000000, start_date=20221111T004717, end_date=20221111T004721 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:21.026627Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "89a2cfcf-bacc-4721-bb72-bb83c553e2bf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..3d060b43 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:17.522754Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "df0ecc64-5498-4024-b673-e31ac75ec1a3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:17.522754+00:00, try_number=1, job_id=528, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-19 00:00:00+00:00 +INFO - Started process 4295 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-19T00:00:00+00:00', '--job-id', '528', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcauhmauh'] +INFO - Job 528: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180519T000000, start_date=20221111T004717, end_date=20221111T004721 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:21.935126Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "df0ecc64-5498-4024-b673-e31ac75ec1a3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..938e4da7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:37.381287Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a466f9f-7c16-47d4-9559-9f15d25fbfeb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:37.381287+00:00, try_number=1, job_id=532, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-19 00:00:00+00:00 +INFO - Started process 4371 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-19T00:00:00+00:00', '--job-id', '532', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpff9fd718'] +INFO - Job 532: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Uib5IMBy4AiP5itLGns+NA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Uib5IMBy4AiP5itLGns+NA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004738Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004738Z +20221111/us-east-1/s3/aws4_request +b1f135c4322c3ea94795e9af394c906b5b0cff3cc2df799e8ddde0a89eb7c9ab +INFO - '2022-11-11' - botocore.auth - Signature: +446e2a6b7a322b0731270c1905905e783310e1b2dc14c66d94ae3f1f81b85f4a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UYHN/5gAcj+ZLsle1HDfWefCoUDGBIGAgh/sAWkoL31zKb4KaN65yvKFQs0s1RerWaLLyZd8ve4=', 'x-amz-request-id': 'QQJ5JH535X67FRJQ', 'Date': 'Fri, 11 Nov 2022 00:47:38 GMT', 'ETag': '"5226f920c072e0088fe62b4b1a7b3e34"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180519T000000, start_date=20221111T004737, end_date=20221111T004739 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:39.363715Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a466f9f-7c16-47d4-9559-9f15d25fbfeb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a348ddab --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:32.257252Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46134c77-99bb-4cfe-ae32-b6173934ec23"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:32.257252+00:00, try_number=1, job_id=531, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-19 00:00:00+00:00 +INFO - Started process 4241 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-19T00:00:00+00:00', '--job-id', '531', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxs_138kd'] +INFO - Job 531: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004733Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004733Z +20221111/us-east-1/s3/aws4_request +478642b5336c9cb9e4bfe5783364496896b4330c3bdc9dfa61addbbdf2a23f4c +INFO - '2022-11-11' - botocore.auth - Signature: +c068efaf3c1a8a9314bc1ceb2d59818f5f7e984b836ac2a7b05962564fd2f338 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'FHLU7nLuqZzu4ccFFeELlU4LUlXeB72OFDswPSO1Y1nXI/Ok2Fz3MoYbfovdso7I4EsQuaxzIJM=', 'x-amz-request-id': 'KZ9FQ460DT9ZT59Q', 'Date': 'Fri, 11 Nov 2022 00:47:33 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180519T000000, start_date=20221111T004732, end_date=20221111T004734 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:34.566344Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46134c77-99bb-4cfe-ae32-b6173934ec23"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a49275a1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:24.093373Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1e962231-48ef-4a69-99b7-a075c0f9d406"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:24.093373+00:00, try_number=1, job_id=529, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-19 00:00:00+00:00 +INFO - Started process 4237 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-19T00:00:00+00:00', '--job-id', '529', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8g5dejsj'] +INFO - Job 529: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180519T000000, start_date=20221111T004724, end_date=20221111T004734 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:34.749529Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1e962231-48ef-4a69-99b7-a075c0f9d406"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..bb71567a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:25.118289Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "32806b3b-3599-3b1f-8afa-0cba393e456a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6c8d5199-8b7b-458a-81fd-fc6d4c1c1c7b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:25.118289+00:00, try_number=1, job_id=530, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-19 00:00:00+00:00 +INFO - Started process 4301 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-19T00:00:00+00:00', '--job-id', '530', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3xcq45z8'] +INFO - Job 530: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180519T000000, start_date=20221111T004725, end_date=20221111T004729 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:29.721965Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6c8d5199-8b7b-458a-81fd-fc6d4c1c1c7b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..87e6291a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:41.329195Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a6b0430-b266-49f4-8bcf-87982312033f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:41.329195+00:00, try_number=1, job_id=534, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-20 00:00:00+00:00 +INFO - Started process 4382 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-20T00:00:00+00:00', '--job-id', '534', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptjfbrcb8'] +INFO - Job 534: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180520T000000, start_date=20221111T004741, end_date=20221111T004744 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:44.093350Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a6b0430-b266-49f4-8bcf-87982312033f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b4cde3e2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:41.320433Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e959816-8568-4d81-bb2c-00bc2e62c9a7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:41.320433+00:00, try_number=1, job_id=533, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-20 00:00:00+00:00 +INFO - Started process 4380 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-20T00:00:00+00:00', '--job-id', '533', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmy681nhm'] +INFO - Job 533: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180520T000000, start_date=20221111T004741, end_date=20221111T004744 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:44.034610Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e959816-8568-4d81-bb2c-00bc2e62c9a7"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..56c902e4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:53.815104Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3384b079-6b82-4379-8c91-d66bf223cdeb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:53.815104+00:00, try_number=1, job_id=538, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-20 00:00:00+00:00 +INFO - Started process 4388 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-20T00:00:00+00:00', '--job-id', '538', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo554wiwf'] +INFO - Job 538: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Uib5IMBy4AiP5itLGns+NA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Uib5IMBy4AiP5itLGns+NA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004754Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004754Z +20221111/us-east-1/s3/aws4_request +44b386cb2a11cd5198297f9bb9ff51364e01ebe1ab947ef7a1821765a8336331 +INFO - '2022-11-11' - botocore.auth - Signature: +59c2ce99ff1aac2c456522ae11dfe4791495e1925ef274f87ae57f1545a770c5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'JS/nRsjmccb28mMF4BGAvVudUduKMDpdGjr5wxZqILK5fjYsV2Fe4BtMpjgKSXeoaV+3u1Re/gU=', 'x-amz-request-id': 'S425N93DG5ETBCY6', 'Date': 'Fri, 11 Nov 2022 00:47:55 GMT', 'ETag': '"5226f920c072e0088fe62b4b1a7b3e34"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180520T000000, start_date=20221111T004753, end_date=20221111T004755 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:55.882404Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3384b079-6b82-4379-8c91-d66bf223cdeb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f2137360 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:50.773002Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d65d60f-f9aa-44a2-b5c0-d45bc77bfa65"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:50.773002+00:00, try_number=1, job_id=537, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-20 00:00:00+00:00 +INFO - Started process 4293 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-20T00:00:00+00:00', '--job-id', '537', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd5lpl1hk'] +INFO - Job 537: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004751Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004751Z +20221111/us-east-1/s3/aws4_request +3c2247caa31b2eaa8e5b3f56403a7d5955e959562ec6c5e2c12194d4fd47a445 +INFO - '2022-11-11' - botocore.auth - Signature: +12d9a6f4f95b888f4bbe5027f25cdd2abf5588305b6a0c5fb5a61c084495408b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'LnMAL5l5QuE0tmlvgs+rLwuNtjJQS/vQF5S+OGPKlrGvjxiSGH5X1fHr/uw9rXjQDcsI5+SwvVQ=', 'x-amz-request-id': 'PD9W5ZR5A4BHJ4QR', 'Date': 'Fri, 11 Nov 2022 00:47:52 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180520T000000, start_date=20221111T004750, end_date=20221111T004752 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:52.965596Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d65d60f-f9aa-44a2-b5c0-d45bc77bfa65"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..eef00f76 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:45.825268Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c802dd7-fad0-497b-9a59-f5c422ca51bb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:45.825268+00:00, try_number=1, job_id=536, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-20 00:00:00+00:00 +INFO - Started process 4253 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-20T00:00:00+00:00', '--job-id', '536', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4j9n0txc'] +INFO - Job 536: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180520T000000, start_date=20221111T004745, end_date=20221111T004752 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:52.090129Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c802dd7-fad0-497b-9a59-f5c422ca51bb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..2f4db2e8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:47:45.805868Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6b66f1e5-a63d-3a99-804b-6f3e008c0d6a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7931a14b-fd70-4046-beb9-f1fceacd9905"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:45.805868+00:00, try_number=1, job_id=535, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-20 00:00:00+00:00 +INFO - Started process 4252 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-20T00:00:00+00:00', '--job-id', '535', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe590d_va'] +INFO - Job 535: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180520T000000, start_date=20221111T004745, end_date=20221111T004748 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:47:48.736971Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7931a14b-fd70-4046-beb9-f1fceacd9905"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ed7ffc6c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:57.764300Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "88a2392f-3f87-4259-b28d-7e539bfeef42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:57.764300+00:00, try_number=1, job_id=540, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-21 00:00:00+00:00 +INFO - Started process 4335 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-21T00:00:00+00:00', '--job-id', '540', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe32d_2_y'] +INFO - Job 540: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180521T000000, start_date=20221111T004757, end_date=20221111T004800 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:00.443461Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "88a2392f-3f87-4259-b28d-7e539bfeef42"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a0215e2c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:47:57.767419Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "01082882-91e1-483d-92d9-deb8e897ebb0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:47:57.767419+00:00, try_number=1, job_id=539, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-21 00:00:00+00:00 +INFO - Started process 4332 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-21T00:00:00+00:00', '--job-id', '539', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3_j8ob7y'] +INFO - Job 539: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180521T000000, start_date=20221111T004757, end_date=20221111T004800 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:00.453273Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "01082882-91e1-483d-92d9-deb8e897ebb0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d32f2f98 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:11.220694Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3807f20e-0163-4bc7-a8f8-c6eb26ba46fa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:11.220694+00:00, try_number=1, job_id=544, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-21 00:00:00+00:00 +INFO - Started process 4460 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-21T00:00:00+00:00', '--job-id', '544', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_6sopytg'] +INFO - Job 544: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Uib5IMBy4AiP5itLGns+NA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Uib5IMBy4AiP5itLGns+NA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004812Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004812Z +20221111/us-east-1/s3/aws4_request +d841f8334891ad729f8a38760b7666181644a0cb56c860352be71a9fb1447c77 +INFO - '2022-11-11' - botocore.auth - Signature: +faaaa9183a838a3a0ce4871423546ad07b79c075721ce494d2e937a6b04594c4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Z3KV5pPRXENR1ASlcGom2DYDOs7zvLWhxTh00yk2U4AcMnPyimYh4AMTMaHFXkAN1NCObemWW3Y=', 'x-amz-request-id': 'J4SV5J3F9ZK3BDN6', 'Date': 'Fri, 11 Nov 2022 00:48:12 GMT', 'ETag': '"5226f920c072e0088fe62b4b1a7b3e34"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180521T000000, start_date=20221111T004811, end_date=20221111T004813 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:13.580275Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3807f20e-0163-4bc7-a8f8-c6eb26ba46fa"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1e6ed645 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:07.650215Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a87a26a9-a2d7-4535-a8fd-676ef029bafa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:07.650215+00:00, try_number=1, job_id=543, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-21 00:00:00+00:00 +INFO - Started process 4350 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-21T00:00:00+00:00', '--job-id', '543', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_185q_zy'] +INFO - Job 543: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004808Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004808Z +20221111/us-east-1/s3/aws4_request +ea0db53ddf22a665d86350f5727f9166fa553dd05e379458d01ae5512ec2ea90 +INFO - '2022-11-11' - botocore.auth - Signature: +35e45d6b007c662fce1267df23cfd855f3588b2f2c759934de7db952b6aadcb5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '4Zv4eqLXGyS58epqJerA6oSkHVmXG9orVUQyOo8spM5reyi3ymv5i2on1pMVSXbkgNilDumVeTQ=', 'x-amz-request-id': 'VZ0SK1WQC7GM34RH', 'Date': 'Fri, 11 Nov 2022 00:48:09 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180521T000000, start_date=20221111T004807, end_date=20221111T004809 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:09.812008Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a87a26a9-a2d7-4535-a8fd-676ef029bafa"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6a8a792f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:02.291212Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "66e5c8ac-ab0e-473d-a168-14cdf2fbce01"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:02.291212+00:00, try_number=1, job_id=542, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-21 00:00:00+00:00 +INFO - Started process 4345 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-21T00:00:00+00:00', '--job-id', '542', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpodht8q61'] +INFO - Job 542: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180521T000000, start_date=20221111T004802, end_date=20221111T004808 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:08.769269Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "66e5c8ac-ab0e-473d-a168-14cdf2fbce01"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f3b71abb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:02.291212Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7c3a4ad2-9bc3-310f-9b2e-e5bc13d9f7eb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a8ba4fa-cf99-4725-98dc-9fd18a7e728b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:02.291212+00:00, try_number=1, job_id=541, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-21 00:00:00+00:00 +INFO - Started process 4344 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-21T00:00:00+00:00', '--job-id', '541', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9hjanl4o'] +INFO - Job 541: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180521T000000, start_date=20221111T004802, end_date=20221111T004804 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:04.767055Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a8ba4fa-cf99-4725-98dc-9fd18a7e728b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..872102e5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:48:15.566272Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8594298c-a383-4925-beb8-39922534d6cb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:15.566272+00:00, try_number=1, job_id=545, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-22 00:00:00+00:00 +INFO - Started process 4469 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-22T00:00:00+00:00', '--job-id', '545', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn15tuooh'] +INFO - Job 545: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180522T000000, start_date=20221111T004815, end_date=20221111T004818 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:18.277746Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8594298c-a383-4925-beb8-39922534d6cb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..3c9955a0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:48:15.568433Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5afc698b-73b4-4af7-a6c9-29d3dc119033"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:15.568433+00:00, try_number=1, job_id=546, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-22 00:00:00+00:00 +INFO - Started process 4471 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-22T00:00:00+00:00', '--job-id', '546', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy083y1z0'] +INFO - Job 546: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180522T000000, start_date=20221111T004815, end_date=20221111T004818 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:18.293393Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5afc698b-73b4-4af7-a6c9-29d3dc119033"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..67e1e7df --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:28.066055Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e2aea38-c31b-427d-acd1-89e10b82c0e9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:28.066055+00:00, try_number=1, job_id=550, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-22 00:00:00+00:00 +INFO - Started process 4430 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-22T00:00:00+00:00', '--job-id', '550', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpre6owj0g'] +INFO - Job 550: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MO17RpO3nnG42k97cTzFbQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MO17RpO3nnG42k97cTzFbQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004828Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004828Z +20221111/us-east-1/s3/aws4_request +0a923d9215aa0c0a3c0bdc845ffb1b07bb7907476e933a3991c601c551ecb936 +INFO - '2022-11-11' - botocore.auth - Signature: +8eabfde4a8081c8524ea86a040f93fdf503b867b166382f792c406daae11198d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'tPVhyHuXmDcJ6G9dZ7O9C96ekvOqMq252/sMn6sduoIG8/vJjHQ9WGZv3KgRVyk3svc1eFOccg4=', 'x-amz-request-id': 'TD18XZR7D4D0N1QS', 'Date': 'Fri, 11 Nov 2022 00:48:29 GMT', 'ETag': '"30ed7b4693b79e71b8da4f7b713cc56d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180522T000000, start_date=20221111T004828, end_date=20221111T004829 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:29.846974Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e2aea38-c31b-427d-acd1-89e10b82c0e9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..7bc00d09 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:25.406294Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "442daa8c-671f-456f-b437-06c5807b9364"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:25.406294+00:00, try_number=1, job_id=549, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-22 00:00:00+00:00 +INFO - Started process 4423 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-22T00:00:00+00:00', '--job-id', '549', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmhp2mra1'] +INFO - Job 549: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004826Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004826Z +20221111/us-east-1/s3/aws4_request +106e65d4a792e41af951d68b6664c43dd301e5484c7678ad72f031f10bd410bd +INFO - '2022-11-11' - botocore.auth - Signature: +e19544deff9a3f55d597d31d093340b07d7963c6bf041591b76df5ed7b8d637d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'tMrvnkZl3Pj3s7civA89FQwpXXD8w/GHkUqFZBcNzkHlKc0g3LsNmIYgEeWzjQ9LR8k+QNQsmQraf3W3Ef5SAw==', 'x-amz-request-id': '148G097R6VAGM6VR', 'Date': 'Fri, 11 Nov 2022 00:48:26 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180522T000000, start_date=20221111T004825, end_date=20221111T004827 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:27.536029Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "442daa8c-671f-456f-b437-06c5807b9364"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d8a18189 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:20.419525Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "80544fa0-6ebb-4a79-9560-db2be3cd8f36"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:20.419525+00:00, try_number=1, job_id=548, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-22 00:00:00+00:00 +INFO - Started process 4481 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-22T00:00:00+00:00', '--job-id', '548', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyg885vbi'] +INFO - Job 548: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180522T000000, start_date=20221111T004820, end_date=20221111T004826 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:26.329967Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "80544fa0-6ebb-4a79-9560-db2be3cd8f36"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..87932ca3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:20.401447Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71275bc7-9978-3813-889b-f1555204e317"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fdb2e6ea-faea-4686-a252-692259e231f1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:20.401447+00:00, try_number=1, job_id=547, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-22 00:00:00+00:00 +INFO - Started process 4478 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-22T00:00:00+00:00', '--job-id', '547', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpomphzo4j'] +INFO - Job 547: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180522T000000, start_date=20221111T004820, end_date=20221111T004823 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:23.375519Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fdb2e6ea-faea-4686-a252-692259e231f1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..704d52a3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:48:31.872877Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9eefade-b9bd-4eec-8cb7-4ed1d4e9cad1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:31.872877+00:00, try_number=1, job_id=552, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-23 00:00:00+00:00 +INFO - Started process 4491 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-23T00:00:00+00:00', '--job-id', '552', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpts7zic2j'] +INFO - Job 552: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180523T000000, start_date=20221111T004831, end_date=20221111T004834 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:34.517374Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9eefade-b9bd-4eec-8cb7-4ed1d4e9cad1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..465ad279 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:48:31.837473Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e90d153e-e7ae-43ab-8607-05d43ed11a0c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:31.837473+00:00, try_number=1, job_id=551, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-23 00:00:00+00:00 +INFO - Started process 4488 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-23T00:00:00+00:00', '--job-id', '551', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps80sv87h'] +INFO - Job 551: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180523T000000, start_date=20221111T004831, end_date=20221111T004834 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:34.576941Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e90d153e-e7ae-43ab-8607-05d43ed11a0c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..158cc49a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:45.802279Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "10eeb640-cf60-4552-bf16-4f5afc64ccd9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:45.802279+00:00, try_number=1, job_id=556, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-23 00:00:00+00:00 +INFO - Started process 4572 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-23T00:00:00+00:00', '--job-id', '556', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyhnmkopz'] +INFO - Job 556: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'm51u60jMxRkYpHFXRmo3Kg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:m51u60jMxRkYpHFXRmo3Kg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004846Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004846Z +20221111/us-east-1/s3/aws4_request +9e7733ad3216710a9d19b2e124e2c7c7c5d3e83ea26e0ee430ca1379ad487238 +INFO - '2022-11-11' - botocore.auth - Signature: +29410ec6bb5b9e58fb44b2898a8fd1cf6a5eb77cefa4781af2a761276aefb1c0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'GhpDdnpPcXnSksmqRlBznYOvxT8K9dKoQMvHRs59BmbEkBpNrfDH1hX8ii9NRiOkDPOcEzVnJ4E=', 'x-amz-request-id': '7BG2X29999XACB2S', 'Date': 'Fri, 11 Nov 2022 00:48:47 GMT', 'ETag': '"9b9d6eeb48ccc51918a47157466a372a"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180523T000000, start_date=20221111T004845, end_date=20221111T004848 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:48.018617Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "10eeb640-cf60-4552-bf16-4f5afc64ccd9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9f124038 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:41.463049Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "007e9205-1468-42c5-bd59-4fda5c5c5321"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:41.463049+00:00, try_number=1, job_id=555, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-23 00:00:00+00:00 +INFO - Started process 4437 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-23T00:00:00+00:00', '--job-id', '555', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkozmdhp3'] +INFO - Job 555: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249955550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004842Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004842Z +20221111/us-east-1/s3/aws4_request +3bca2af094de82e4191c36b6a91ca54ea2790241752bc27d57d94ffa3401c1a9 +INFO - '2022-11-11' - botocore.auth - Signature: +e385ce239419cff049b894aa25f4e0e72cf3607f399df311f09643611904bd40 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '7QCWwKJH8ixY9WwEx6y43vkjco0y5vEwJe72bGRJFrBY6NM/LtoM4+BEVg5aF5hcwQwy3GDRBGw=', 'x-amz-request-id': '67CFBMZS29R287HM', 'Date': 'Fri, 11 Nov 2022 00:48:43 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180523T000000, start_date=20221111T004841, end_date=20221111T004843 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:43.717138Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "007e9205-1468-42c5-bd59-4fda5c5c5321"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..10336846 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:36.681446Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e0e9b4e0-adff-4e33-b15a-2627e1f854a7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:36.681446+00:00, try_number=1, job_id=554, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-23 00:00:00+00:00 +INFO - Started process 4539 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-23T00:00:00+00:00', '--job-id', '554', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwm_tkb1_'] +INFO - Job 554: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180523T000000, start_date=20221111T004836, end_date=20221111T004844 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:44.162459Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e0e9b4e0-adff-4e33-b15a-2627e1f854a7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..2608453d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:36.669490Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbf133a7-a0d8-3424-ad1a-f14f25e264b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e9183f03-6b51-42be-8bcd-00aee453f167"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:36.669490+00:00, try_number=1, job_id=553, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-23 00:00:00+00:00 +INFO - Started process 4537 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-23T00:00:00+00:00', '--job-id', '553', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpygum9sxa'] +INFO - Job 553: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180523T000000, start_date=20221111T004836, end_date=20221111T004839 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:39.676858Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e9183f03-6b51-42be-8bcd-00aee453f167"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7312eb12 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:48:50.739607Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7549804d-5f33-4a50-9684-52d92e7c677e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:50.739607+00:00, try_number=1, job_id=557, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-24 00:00:00+00:00 +INFO - Started process 4469 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-24T00:00:00+00:00', '--job-id', '557', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuco8byr5'] +INFO - Job 557: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180524T000000, start_date=20221111T004850, end_date=20221111T004853 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:53.823470Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7549804d-5f33-4a50-9684-52d92e7c677e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..3b1516fe --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:48:50.750724Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36898267-cfe1-482c-8a4f-e6ba3eeaae13"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:50.750724+00:00, try_number=1, job_id=558, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-24 00:00:00+00:00 +INFO - Started process 4476 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-24T00:00:00+00:00', '--job-id', '558', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_9mam3fc'] +INFO - Job 558: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180524T000000, start_date=20221111T004850, end_date=20221111T004853 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:53.831830Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36898267-cfe1-482c-8a4f-e6ba3eeaae13"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..8045fb2e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:04.280026Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b1dd651-eb83-4692-8c60-5e4ce087dc02"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:04.280026+00:00, try_number=1, job_id=562, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-24 00:00:00+00:00 +INFO - Started process 4526 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-24T00:00:00+00:00', '--job-id', '562', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfgg34np_'] +INFO - Job 562: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MO17RpO3nnG42k97cTzFbQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MO17RpO3nnG42k97cTzFbQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004905Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004905Z +20221111/us-east-1/s3/aws4_request +2956c1ddc1bfc12109c3c857cf4d08c973dede942c925b5b1c52a1caaa174946 +INFO - '2022-11-11' - botocore.auth - Signature: +729bdf116f99050673e64647eca505afab190aa96beb0e650d1f7e3610d74e88 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'CX8Oays3GqCVIUQzbo8KOZSnFHAxPGDlFVvkFM7M82vS1o0ymyhmySwYT4LjiGI24QWCGTWjVeM=', 'x-amz-request-id': 'E0FE726A18NDCCRR', 'Date': 'Fri, 11 Nov 2022 00:49:05 GMT', 'ETag': '"30ed7b4693b79e71b8da4f7b713cc56d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180524T000000, start_date=20221111T004904, end_date=20221111T004906 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:06.405708Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b1dd651-eb83-4692-8c60-5e4ce087dc02"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b64506d6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:01.069729Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e386d6da-4add-411a-ba45-20edb2a470bf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:01.069729+00:00, try_number=1, job_id=561, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-24 00:00:00+00:00 +INFO - Started process 4519 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-24T00:00:00+00:00', '--job-id', '561', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp667zn0uy'] +INFO - Job 561: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004902Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004902Z +20221111/us-east-1/s3/aws4_request +4aa0849c449b3f38544b216c8a37ac76cc0b0be4d4e01089e0431addbb2548fb +INFO - '2022-11-11' - botocore.auth - Signature: +ae7b7aac2f7545bde66c2b4ab1ac45af9f12c50e4fdfb1d804ce6c595a7c5a10 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'x5L0qFNm17l0QdYUflWC9dNy8kl58YY79TWibSB5walBMdy1Lti3kM2W6572IxpRUxGG2tlquHk=', 'x-amz-request-id': '20XSSTZ69QPQFGV8', 'Date': 'Fri, 11 Nov 2022 00:49:02 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180524T000000, start_date=20221111T004901, end_date=20221111T004903 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:03.423229Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e386d6da-4add-411a-ba45-20edb2a470bf"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..450c2a5b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:56.106411Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bf51752-7375-45c7-b6b6-42b62bdd27d1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:56.106411+00:00, try_number=1, job_id=560, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-24 00:00:00+00:00 +INFO - Started process 4583 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-24T00:00:00+00:00', '--job-id', '560', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2w5l2dfi'] +INFO - Job 560: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180524T000000, start_date=20221111T004856, end_date=20221111T004902 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:02.119552Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bf51752-7375-45c7-b6b6-42b62bdd27d1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..102556ca --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:48:56.090806Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b361a24d-501c-379f-87a6-54d983687d33"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "52b39c00-e366-42ca-8bad-ae5b5a1f366e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:48:56.090806+00:00, try_number=1, job_id=559, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-24 00:00:00+00:00 +INFO - Started process 4581 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-24T00:00:00+00:00', '--job-id', '559', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzqgbcoz5'] +INFO - Job 559: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180524T000000, start_date=20221111T004856, end_date=20221111T004859 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:48:59.232006Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "52b39c00-e366-42ca-8bad-ae5b5a1f366e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9d15797d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:49:09.985691Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "343f4747-6679-4c51-8718-3d3058647ae2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:09.985691+00:00, try_number=1, job_id=563, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-25 00:00:00+00:00 +INFO - Started process 4655 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-25T00:00:00+00:00', '--job-id', '563', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_qccyy9q'] +INFO - Job 563: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180525T000000, start_date=20221111T004909, end_date=20221111T004913 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:13.039190Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "343f4747-6679-4c51-8718-3d3058647ae2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..dff14ef6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:49:10.286851Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d566f5d2-068b-40db-9dd4-72766073a554"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:10.286851+00:00, try_number=1, job_id=564, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-25 00:00:00+00:00 +INFO - Started process 4658 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-25T00:00:00+00:00', '--job-id', '564', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0d_q2k_e'] +INFO - Job 564: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180525T000000, start_date=20221111T004910, end_date=20221111T004913 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:13.046669Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d566f5d2-068b-40db-9dd4-72766073a554"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..04ce5416 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:23.591455Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b3bc8a05-e0de-4e18-a250-a74365ca0ac8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:23.591455+00:00, try_number=1, job_id=568, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-25 00:00:00+00:00 +INFO - Started process 4590 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-25T00:00:00+00:00', '--job-id', '568', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp26ta9a81'] +INFO - Job 568: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MO17RpO3nnG42k97cTzFbQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:MO17RpO3nnG42k97cTzFbQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004924Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004924Z +20221111/us-east-1/s3/aws4_request +df2ea274864aed462110c922cc281cd22c1216b997a4d6161dc6863ce17d2ac0 +INFO - '2022-11-11' - botocore.auth - Signature: +9c9628cabc9637e33b480f4b68dc4e5dd696b70443586f5c6fb191c95ef4cfc3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '5vSjGM507aebvtdm3qm9N8TnNYFzOzhocAjZSTdYrasEsqerudiia9077vS82HazvNBTni+CMSc=', 'x-amz-request-id': 'T7RCNM76G3ZM4DZG', 'Date': 'Fri, 11 Nov 2022 00:49:24 GMT', 'ETag': '"30ed7b4693b79e71b8da4f7b713cc56d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180525T000000, start_date=20221111T004923, end_date=20221111T004925 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:25.374703Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b3bc8a05-e0de-4e18-a250-a74365ca0ac8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..561a3b9d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:20.445969Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e1708843-6796-4f61-a344-ac57dd214bdb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:20.445969+00:00, try_number=1, job_id=567, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-25 00:00:00+00:00 +INFO - Started process 4553 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-25T00:00:00+00:00', '--job-id', '567', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph59noo7p'] +INFO - Job 567: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004921Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004921Z +20221111/us-east-1/s3/aws4_request +df84140f00790c744477e60a03d7f4afc5abd0552f131161b9f881ad395eb32d +INFO - '2022-11-11' - botocore.auth - Signature: +d14fe0e5bb013a2ee8086ab07a1aae7925f5d1cfc97a207ac7b49dd30d67e741 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'QMPRaoTi1IjL/x/VhKlpZ1cnbYNbSz5bG6EyQyC6q3Qw6ZiYSOprF5Sbtre0OQoQmSSuIe/XH2o=', 'x-amz-request-id': 'BDW2E9J7XYCBK3VB', 'Date': 'Fri, 11 Nov 2022 00:49:21 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180525T000000, start_date=20221111T004920, end_date=20221111T004923 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:23.064401Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e1708843-6796-4f61-a344-ac57dd214bdb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6566ae48 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:14.817897Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f87734b-4130-425f-bc6b-279158dc2012"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:14.817897+00:00, try_number=1, job_id=565, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-25 00:00:00+00:00 +INFO - Started process 4665 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-25T00:00:00+00:00', '--job-id', '565', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2iadwwk7'] +INFO - Job 565: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180525T000000, start_date=20221111T004914, end_date=20221111T004921 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:21.228513Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f87734b-4130-425f-bc6b-279158dc2012"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..10265f0a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:15.047157Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7ad50455-1347-36dd-89f6-74e3874560b8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c9a31de4-4877-4df6-acb3-3426943295a9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:15.047157+00:00, try_number=1, job_id=566, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-25 00:00:00+00:00 +INFO - Started process 4668 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-25T00:00:00+00:00', '--job-id', '566', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvtspqdpt'] +INFO - Job 566: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180525T000000, start_date=20221111T004915, end_date=20221111T004917 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:17.828062Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c9a31de4-4877-4df6-acb3-3426943295a9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f6753c21 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:49:27.427673Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "71fb1110-e363-4610-83c2-9ab28004c1c2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:27.427673+00:00, try_number=1, job_id=569, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-26 00:00:00+00:00 +INFO - Started process 4675 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-26T00:00:00+00:00', '--job-id', '569', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3_eub9yp'] +INFO - Job 569: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180526T000000, start_date=20221111T004927, end_date=20221111T004931 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:31.122993Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "71fb1110-e363-4610-83c2-9ab28004c1c2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c02f054c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:49:27.426664Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb8fbd31-dff9-479c-9bfb-78291fbb6ae9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:27.426664+00:00, try_number=1, job_id=570, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-26 00:00:00+00:00 +INFO - Started process 4678 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-26T00:00:00+00:00', '--job-id', '570', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd_l0g7b_'] +INFO - Job 570: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180526T000000, start_date=20221111T004927, end_date=20221111T004930 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:30.937051Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb8fbd31-dff9-479c-9bfb-78291fbb6ae9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d61815e6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:42.811770Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d75d83fd-7ab6-4877-961f-73f2cd2545b5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:42.811770+00:00, try_number=1, job_id=574, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-26 00:00:00+00:00 +INFO - Started process 4754 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-26T00:00:00+00:00', '--job-id', '574', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfpnqf91s'] +INFO - Job 574: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'EAP1xWOpqa9LfOohFepJ+A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:EAP1xWOpqa9LfOohFepJ+A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004943Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004943Z +20221111/us-east-1/s3/aws4_request +608785cbd1b2135a4cebc0a605c3ab37ab05f917f54d779cc53bcf97e63842f9 +INFO - '2022-11-11' - botocore.auth - Signature: +b05df5fd681c02384ca9f653d095af732ecedba6d2a6e5b614906241b3b7fdea +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6y/pg147/04L6lmQY7u83pUwLdw8C4w5CAMl7qsv6kXO+pcvWqYHZW+tAa7HoJ/U8J5shCmTlTs=', 'x-amz-request-id': 'EF0FZRJBNBRM77BM', 'Date': 'Fri, 11 Nov 2022 00:49:44 GMT', 'ETag': '"1003f5c563a9a9af4b7cea2115ea49f8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180526T000000, start_date=20221111T004942, end_date=20221111T004944 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:44.806468Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d75d83fd-7ab6-4877-961f-73f2cd2545b5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..53568c63 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:37.787920Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "146682b8-cfef-4d58-9ae7-cb71c5a9e58d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:37.787920+00:00, try_number=1, job_id=573, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-26 00:00:00+00:00 +INFO - Started process 4617 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-26T00:00:00+00:00', '--job-id', '573', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2h6jxul4'] +INFO - Job 573: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004938Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004938Z +20221111/us-east-1/s3/aws4_request +8914bdf76398b1d706b072249dca3e1da2f07ed09d7f446024c9b49e58c0b892 +INFO - '2022-11-11' - botocore.auth - Signature: +81be69740a0a6bcf59cd4a08029e68419d6b7ec2644d978df4c42b1d71acb1ea +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'tKABRCbSuejjXLiTVqoWrrdEMxKcONAGTP0kSLCFw0VihdyxZG/gCeNgMNpJ/zqKmowpfvmO0WiFumK/QY5gOw==', 'x-amz-request-id': 'HYNESQZTPZD1HPHC', 'Date': 'Fri, 11 Nov 2022 00:49:39 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180526T000000, start_date=20221111T004937, end_date=20221111T004940 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:40.132107Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "146682b8-cfef-4d58-9ae7-cb71c5a9e58d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..5bd84403 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:33.865832Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "655ce4d1-5635-462e-877f-21945c469f82"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:33.865832+00:00, try_number=1, job_id=572, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-26 00:00:00+00:00 +INFO - Started process 4684 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-26T00:00:00+00:00', '--job-id', '572', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzlz8lll0'] +INFO - Job 572: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180526T000000, start_date=20221111T004933, end_date=20221111T004940 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:40.944061Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "655ce4d1-5635-462e-877f-21945c469f82"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..8d1d471c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:32.263333Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "93a1f1ae-cd7b-3d54-be7b-0c2d1257c852"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a67c3110-dc1e-49c6-bb44-b1a8034a1b06"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:32.263333+00:00, try_number=1, job_id=571, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-26 00:00:00+00:00 +INFO - Started process 4612 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-26T00:00:00+00:00', '--job-id', '571', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1spjwe8a'] +INFO - Job 571: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180526T000000, start_date=20221111T004932, end_date=20221111T004935 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:35.086937Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a67c3110-dc1e-49c6-bb44-b1a8034a1b06"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f719c991 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:49:47.429965Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65ed8ce3-7212-4555-8537-1d35e8ea7ec7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:47.429965+00:00, try_number=1, job_id=576, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-27 00:00:00+00:00 +INFO - Started process 4628 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-27T00:00:00+00:00', '--job-id', '576', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptulmeyc4'] +INFO - Job 576: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180527T000000, start_date=20221111T004947, end_date=20221111T004950 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:50.082325Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65ed8ce3-7212-4555-8537-1d35e8ea7ec7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a70e2f03 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:49:47.368688Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b074dae4-c35b-4ba8-93d5-e2f149f0ef22"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:47.368688+00:00, try_number=1, job_id=575, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-27 00:00:00+00:00 +INFO - Started process 4626 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-27T00:00:00+00:00', '--job-id', '575', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfbad827u'] +INFO - Job 575: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180527T000000, start_date=20221111T004947, end_date=20221111T004950 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:50.101037Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b074dae4-c35b-4ba8-93d5-e2f149f0ef22"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..19fb46c8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:03.420664Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c439891b-a72d-475d-9367-7b3aac49a997"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:03.420664+00:00, try_number=1, job_id=580, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-27 00:00:00+00:00 +INFO - Started process 4771 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-27T00:00:00+00:00', '--job-id', '580', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx_0w8exe'] +INFO - Job 580: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'zscYCwwm02G6vVArltw84g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:zscYCwwm02G6vVArltw84g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005004Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005004Z +20221111/us-east-1/s3/aws4_request +73433065d5941ec4d2070216c52e356afd17241c6be43c34f50166fe341434e0 +INFO - '2022-11-11' - botocore.auth - Signature: +be8ac3bee95ea2ea4e4c910bf06f68ef9feb51297ac0d32bc8b48044d7baf272 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '4ecCUBZxvumTgmB3qgHskC5oFkoUjt7e9ubyh60lIdphKoRgYhCcKcDrBdLp33hb3hztpl5YH30=', 'x-amz-request-id': 'JYQ9GBP5B0P81AYG', 'Date': 'Fri, 11 Nov 2022 00:50:04 GMT', 'ETag': '"cec7180b0c26d361babd502b96dc3ce2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180527T000000, start_date=20221111T005003, end_date=20221111T005005 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:05.567517Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c439891b-a72d-475d-9367-7b3aac49a997"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..62ba6334 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:58.333189Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6deece3-8540-4bd7-b099-bf0127575c00"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:58.333189+00:00, try_number=1, job_id=579, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-27 00:00:00+00:00 +INFO - Started process 4694 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-27T00:00:00+00:00', '--job-id', '579', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsg3s291w'] +INFO - Job 579: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T004959Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T004959Z +20221111/us-east-1/s3/aws4_request +8c00be86c2400db22cf3c25f318b489a3ab9304488aa0c9b90ab8140d2f2cb5f +INFO - '2022-11-11' - botocore.auth - Signature: +f5087b3ca231a643598e01d114004fcc709efd30c4b882bc3c2756991fa1ef8a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'pvUlzevRQJJolaTZ4XWlZo2//s1hk/Kd7AoA0wCiR/8aboemDRcdEL0bJIDcqZjCc+Ck/Vh5waA=', 'x-amz-request-id': 'WSN1YE56EBY5V7EH', 'Date': 'Fri, 11 Nov 2022 00:49:59 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180527T000000, start_date=20221111T004958, end_date=20221111T005000 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:00.525004Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6deece3-8540-4bd7-b099-bf0127575c00"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..5c0ee19e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:52.296164Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "07aea55c-c14c-48f9-9579-1d17a5a8fb65"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:52.296164+00:00, try_number=1, job_id=577, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-27 00:00:00+00:00 +INFO - Started process 4763 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-27T00:00:00+00:00', '--job-id', '577', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5piezhvf'] +INFO - Job 577: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180527T000000, start_date=20221111T004952, end_date=20221111T005001 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:01.321981Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "07aea55c-c14c-48f9-9579-1d17a5a8fb65"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..b89ef7da --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:49:52.334431Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f00db63c-4b60-3311-bb78-239775d0373d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "47a5eae0-4d78-45cb-9d20-c395d0e575b6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:49:52.334431+00:00, try_number=1, job_id=578, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-27 00:00:00+00:00 +INFO - Started process 4765 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-27T00:00:00+00:00', '--job-id', '578', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpajyh0zv0'] +INFO - Job 578: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180527T000000, start_date=20221111T004952, end_date=20221111T004955 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:49:55.330263Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "47a5eae0-4d78-45cb-9d20-c395d0e575b6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6207d169 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:50:08.512107Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "38338be7-f1dc-4684-8cba-c57e123e9812"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:08.512107+00:00, try_number=1, job_id=581, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-28 00:00:00+00:00 +INFO - Started process 4779 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-28T00:00:00+00:00', '--job-id', '581', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr86yn59p'] +INFO - Job 581: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180528T000000, start_date=20221111T005008, end_date=20221111T005011 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:11.896419Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "38338be7-f1dc-4684-8cba-c57e123e9812"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..011e46ce --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:50:09.387625Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93b0d899-9a07-4fc6-b892-1d5db10253e4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:09.387625+00:00, try_number=1, job_id=582, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-28 00:00:00+00:00 +INFO - Started process 4782 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-28T00:00:00+00:00', '--job-id', '582', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy2yp12l6'] +INFO - Job 582: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180528T000000, start_date=20221111T005009, end_date=20221111T005012 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:12.992211Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93b0d899-9a07-4fc6-b892-1d5db10253e4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..531462b9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:34.043464Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "37cbed65-9931-45cd-af32-21d9b4cc51d1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:34.043464+00:00, try_number=1, job_id=586, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-28 00:00:00+00:00 +INFO - Started process 4800 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-28T00:00:00+00:00', '--job-id', '586', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpys5d8bkg'] +INFO - Job 586: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'zscYCwwm02G6vVArltw84g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:zscYCwwm02G6vVArltw84g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005035Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005035Z +20221111/us-east-1/s3/aws4_request +b6e5dd963d8411f316ddae5fae8776c310b248c7f0bdf184b6df3fce218b4975 +INFO - '2022-11-11' - botocore.auth - Signature: +06bd721547ab517aab9d7fed9812d62968b4fe85903f9e09fc7f581081e4c635 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'hOEza61r7Xdat1y6lGA6M78wOlMB1UNAXXdX5s+ekbjc5cY1Siz9mLQPWfu6nW3/LsayYnqWViY=', 'x-amz-request-id': 'Q6TZMFCKKZFSP6T2', 'Date': 'Fri, 11 Nov 2022 00:50:36 GMT', 'ETag': '"cec7180b0c26d361babd502b96dc3ce2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180528T000000, start_date=20221111T005034, end_date=20221111T005036 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:36.846551Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "37cbed65-9931-45cd-af32-21d9b4cc51d1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a73b4307 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:24.904609Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6512d43a-dceb-4e57-ae93-b6739c8acc40"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:24.904609+00:00, try_number=1, job_id=585, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-28 00:00:00+00:00 +INFO - Started process 4793 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-28T00:00:00+00:00', '--job-id', '585', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphdwi1naf'] +INFO - Job 585: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50041f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005027Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005027Z +20221111/us-east-1/s3/aws4_request +c2d25c708f1f782345bec318703c955766bcc3d9d6c4299780234ed6b95cda81 +INFO - '2022-11-11' - botocore.auth - Signature: +fb30fccd8460af4fe65c324438e8810ea9d4ec40a4ac9f7e65d09853f3f10a29 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '075A+TA1twbj1tZzWPT9aSFVIcWiytLhrPZOlsAS+OBNyMOUnq3gdyr1GQWcOpGpfcFNzCyy81k=', 'x-amz-request-id': 'SRJ56F6XQ4V4BFTF', 'Date': 'Fri, 11 Nov 2022 00:50:28 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180528T000000, start_date=20221111T005024, end_date=20221111T005029 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:29.110085Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6512d43a-dceb-4e57-ae93-b6739c8acc40"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..efdb51d6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:15.560624Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "791020c0-65e1-4c82-8df9-1873af670f8a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:15.560624+00:00, try_number=1, job_id=583, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-28 00:00:00+00:00 +INFO - Started process 4706 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-28T00:00:00+00:00', '--job-id', '583', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptqqmkcec'] +INFO - Job 583: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180528T000000, start_date=20221111T005015, end_date=20221111T005030 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:30.149219Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "791020c0-65e1-4c82-8df9-1873af670f8a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..80a8766a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:17.861210Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f2ea8d7-63d7-3cf2-a650-34ddae6bdf14"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58389aca-d447-4f76-9481-eb3b872ddd8c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:17.861210+00:00, try_number=1, job_id=584, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-28 00:00:00+00:00 +INFO - Started process 4788 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-28T00:00:00+00:00', '--job-id', '584', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpscosh63v'] +INFO - Job 584: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180528T000000, start_date=20221111T005017, end_date=20221111T005021 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:21.721704Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58389aca-d447-4f76-9481-eb3b872ddd8c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..e775ed3a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:50:41.261701Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a604103-ce7b-43a6-b3c0-1cec1f17e90a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:41.261701+00:00, try_number=1, job_id=588, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-29 00:00:00+00:00 +INFO - Started process 4715 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-29T00:00:00+00:00', '--job-id', '588', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvi5b60tz'] +INFO - Job 588: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180529T000000, start_date=20221111T005041, end_date=20221111T005044 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:44.474956Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a604103-ce7b-43a6-b3c0-1cec1f17e90a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b959b134 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:50:41.238364Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "20fc9035-581f-440b-967e-6098ec40306e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:41.238364+00:00, try_number=1, job_id=587, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-29 00:00:00+00:00 +INFO - Started process 4714 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-29T00:00:00+00:00', '--job-id', '587', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpif27eeu7'] +INFO - Job 587: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180529T000000, start_date=20221111T005041, end_date=20221111T005044 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:44.463618Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "20fc9035-581f-440b-967e-6098ec40306e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..cb934f70 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:57.603863Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b39b2562-e561-475b-a9f9-c13967636965"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:57.603863+00:00, try_number=1, job_id=592, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-29 00:00:00+00:00 +INFO - Started process 4882 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-29T00:00:00+00:00', '--job-id', '592', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjv0903nf'] +INFO - Job 592: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '3WSoPw0fzK2CiOsLQkbReQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:3WSoPw0fzK2CiOsLQkbReQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005058Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005058Z +20221111/us-east-1/s3/aws4_request +9d201cd4af7a8c1ee5f71d85bfdb364747dc2a2ee557e9dafbcc531dd9448af8 +INFO - '2022-11-11' - botocore.auth - Signature: +7509534f7b4b8575eb4adebcb1162e2e7b1945fc0c27d88f8e4b666e3c91267c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6/xVpxjZihapYeOp4OYmzLeY+y2JVPo8vMZy6Qv5XInLfT/uRSLSER3OJrYXPUBKeFptQ3Y8sZo=', 'x-amz-request-id': '9EBMMCHWZMS20JQR', 'Date': 'Fri, 11 Nov 2022 00:50:58 GMT', 'ETag': '"dd64a83f0d1fccad8288eb0b4246d179"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180529T000000, start_date=20221111T005057, end_date=20221111T005059 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:59.505559Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b39b2562-e561-475b-a9f9-c13967636965"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c29f0ca7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:53.409612Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a2976976-b6f7-4084-acd0-3004bf904b86"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:53.409612+00:00, try_number=1, job_id=591, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-29 00:00:00+00:00 +INFO - Started process 4721 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-29T00:00:00+00:00', '--job-id', '591', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfylb5_m6'] +INFO - Job 591: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499501f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005054Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005054Z +20221111/us-east-1/s3/aws4_request +c00a533f9cf5d36a2a6d0fe45da327daafdb2219530e8dd0103120e496c2653d +INFO - '2022-11-11' - botocore.auth - Signature: +11b49d493eb9a0851c547fc78a8e21767f7d3b7e936cc48d9f51b92603c9f4b7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'OGqP2RXQqoJL5uhKlC63qakvRwMcRBmTL6U0heKl/Lh6sttH0bMGw9aWIQe/Br4gauCmkYlK6k4=', 'x-amz-request-id': '2Y2MWF37K9AHM9C6', 'Date': 'Fri, 11 Nov 2022 00:50:55 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180529T000000, start_date=20221111T005053, end_date=20221111T005056 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:56.084084Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a2976976-b6f7-4084-acd0-3004bf904b86"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ea6cd9c6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:47.061898Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "06150ea3-1099-4784-a39e-d7c35a5088fc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:47.061898+00:00, try_number=1, job_id=589, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-29 00:00:00+00:00 +INFO - Started process 4873 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-29T00:00:00+00:00', '--job-id', '589', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe3l1vsyl'] +INFO - Job 589: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180529T000000, start_date=20221111T005047, end_date=20221111T005055 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:55.237891Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "06150ea3-1099-4784-a39e-d7c35a5088fc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..27266bd5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:50:47.800317Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ec253907-11e1-36e6-b1e7-90be2b01b51f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e7a1463-1fbb-45e9-8723-72f3075b2d19"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:50:47.800317+00:00, try_number=1, job_id=590, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-29 00:00:00+00:00 +INFO - Started process 4876 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-29T00:00:00+00:00', '--job-id', '590', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd00pelec'] +INFO - Job 590: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180529T000000, start_date=20221111T005047, end_date=20221111T005050 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:50:50.912842Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e7a1463-1fbb-45e9-8723-72f3075b2d19"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..965da6da --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:01.721674Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d56ccf0e-119e-4e9a-8edd-6bab904ed159"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:01.721674+00:00, try_number=1, job_id=594, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-30 00:00:00+00:00 +INFO - Started process 4797 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-30T00:00:00+00:00', '--job-id', '594', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjqkoq1cj'] +INFO - Job 594: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180530T000000, start_date=20221111T005101, end_date=20221111T005104 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:04.589633Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d56ccf0e-119e-4e9a-8edd-6bab904ed159"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..cad32803 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:01.711374Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e1930ba-96cd-4eab-8f9c-2a8315171079"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:01.711374+00:00, try_number=1, job_id=593, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-30 00:00:00+00:00 +INFO - Started process 4795 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-30T00:00:00+00:00', '--job-id', '593', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpinmqtdmn'] +INFO - Job 593: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180530T000000, start_date=20221111T005101, end_date=20221111T005104 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:04.591157Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e1930ba-96cd-4eab-8f9c-2a8315171079"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..0db7e414 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:13.684932Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57f8ad38-29c4-4939-89c7-26d075a99299"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:13.684932+00:00, try_number=1, job_id=598, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-30 00:00:00+00:00 +INFO - Started process 4820 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-30T00:00:00+00:00', '--job-id', '598', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnj08di5g'] +INFO - Job 598: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'SKoceFXWB+5yZBuipSIZSA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:SKoceFXWB+5yZBuipSIZSA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005114Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005114Z +20221111/us-east-1/s3/aws4_request +fbf5e427c5053f57e0dc8ff0db9ada941f97f40a1098110af6d42ca657b78ba9 +INFO - '2022-11-11' - botocore.auth - Signature: +0db8dc2c4a4febba6f6ca91b14a2666522c075c9ebb547af23e766f44ae16749 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'qnmxlMSfOJe3npY1c3mtv6x/LO/5LljzXzOzlum+vGKTN3CDZoaEqhKF2JC93KJwyTA4eUgQmVE=', 'x-amz-request-id': 'EQND2R449262MMV3', 'Date': 'Fri, 11 Nov 2022 00:51:15 GMT', 'ETag': '"48aa1c7855d607ee72641ba2a5221948"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180530T000000, start_date=20221111T005113, end_date=20221111T005115 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:15.778307Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57f8ad38-29c4-4939-89c7-26d075a99299"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..7a74bb22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:11.389777Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "66f90be7-076b-412a-83c5-b9833f7a1982"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:11.389777+00:00, try_number=1, job_id=597, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-30 00:00:00+00:00 +INFO - Started process 4813 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-30T00:00:00+00:00', '--job-id', '597', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpauzy0gdo'] +INFO - Job 597: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005112Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005112Z +20221111/us-east-1/s3/aws4_request +b9420c4d9a763379fc7dd2510da5019da1da02c6fe3d19bfa3d6c0faf959150a +INFO - '2022-11-11' - botocore.auth - Signature: +a93d4cf06826a45c8bb810db0b93e40378990dfdee5b801d21e207b5a0bfa45f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'wKYwTwXwC4Os5oyYJeibME+ru4V1dwtRBEU0DgGLgz3xPV0SKtOwyRrayzLD25AeI4wqnZdt9RY=', 'x-amz-request-id': 'G3V1YJ7SV0HERZHT', 'Date': 'Fri, 11 Nov 2022 00:51:13 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180530T000000, start_date=20221111T005111, end_date=20221111T005113 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:13.852568Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "66f90be7-076b-412a-83c5-b9833f7a1982"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c18cd163 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:06.015720Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "31e079d3-7d3e-431f-9bcd-772fdf74d0e5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:06.015720+00:00, try_number=1, job_id=595, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-30 00:00:00+00:00 +INFO - Started process 4806 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-30T00:00:00+00:00', '--job-id', '595', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7j9nnmp3'] +INFO - Job 595: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180530T000000, start_date=20221111T005106, end_date=20221111T005111 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:11.587431Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "31e079d3-7d3e-431f-9bcd-772fdf74d0e5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..589d742d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:06.029585Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d27c93c1-afce-3e26-b923-a4f397743751"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a00f444-bd1b-4511-9555-b6b28ae7b629"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:06.029585+00:00, try_number=1, job_id=596, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-30 00:00:00+00:00 +INFO - Started process 4807 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-30T00:00:00+00:00', '--job-id', '596', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjbzf6tzh'] +INFO - Job 596: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180530T000000, start_date=20221111T005106, end_date=20221111T005108 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:08.601052Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a00f444-bd1b-4511-9555-b6b28ae7b629"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9e3fd5a0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:19.071165Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e79014cc-761e-4b73-b133-9616c706badb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-05-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:19.071165+00:00, try_number=1, job_id=600, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-31 00:00:00+00:00 +INFO - Started process 4831 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-05-31T00:00:00+00:00', '--job-id', '600', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkq2ubwpn'] +INFO - Job 600: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180531T000000, start_date=20221111T005119, end_date=20221111T005122 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:22.273264Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e79014cc-761e-4b73-b133-9616c706badb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..fb67c6f1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:19.073397Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3acaf295-5f5c-4540-9c15-efeb3ee981fa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-05-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:19.073397+00:00, try_number=1, job_id=599, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-31 00:00:00+00:00 +INFO - Started process 4830 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-05-31T00:00:00+00:00', '--job-id', '599', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzfht3qbq'] +INFO - Job 599: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180531T000000, start_date=20221111T005119, end_date=20221111T005122 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:22.275532Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3acaf295-5f5c-4540-9c15-efeb3ee981fa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..3bbe454b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:35.834151Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8ed668e8-5219-4071-8aee-8ece6ed97d3f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-05-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:35.834151+00:00, try_number=1, job_id=604, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-31 00:00:00+00:00 +INFO - Started process 4909 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-05-31T00:00:00+00:00', '--job-id', '604', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq_ln8nlz'] +INFO - Job 604: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'SKoceFXWB+5yZBuipSIZSA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:SKoceFXWB+5yZBuipSIZSA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005136Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005136Z +20221111/us-east-1/s3/aws4_request +48aa5f57a4eaa38474814c3cd89e5bfcf6b3da15c0f640e6ec15fbe9fa736351 +INFO - '2022-11-11' - botocore.auth - Signature: +c376bb4f821dabf7ea160859b52f57013dc17a0521cbd92dd543874767eabf3e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'WI70jArSvTG2CEYqu/31tppupSdiQ60ffht4mXbrJlOfljtdVcQAoiTS4qUgvqkITdz0+Zs3W5I=', 'x-amz-request-id': 'RB27ZW548ZB2X9AG', 'Date': 'Fri, 11 Nov 2022 00:51:37 GMT', 'ETag': '"48aa1c7855d607ee72641ba2a5221948"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180531T000000, start_date=20221111T005135, end_date=20221111T005137 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:37.952613Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8ed668e8-5219-4071-8aee-8ece6ed97d3f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..26cc56aa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:30.877107Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0c9cf03f-912f-4616-8d1c-969daee47a76"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-05-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:30.877107+00:00, try_number=1, job_id=603, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-31 00:00:00+00:00 +INFO - Started process 4902 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-05-31T00:00:00+00:00', '--job-id', '603', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps0ykxifk'] +INFO - Job 603: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005131Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005131Z +20221111/us-east-1/s3/aws4_request +7fc5cf2fa092b9b88b549453401d3d90bd13b1addf554b5bcfcb73fec0d5fa8b +INFO - '2022-11-11' - botocore.auth - Signature: +5637d49bd14538e90f62bbfdb56ef075913574fd740f4130f64a2ff87e7c91aa +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '0LHDTbHltAaBNvPQ432EGCKoC87IeTrq2BB/UemEmVoWSSko5LL+I8jtxOy4UxfdhJJS0Ukh9zw=', 'x-amz-request-id': '49BNZRDA3BNFTY87', 'Date': 'Fri, 11 Nov 2022 00:51:32 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180531T000000, start_date=20221111T005130, end_date=20221111T005133 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:33.230526Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0c9cf03f-912f-4616-8d1c-969daee47a76"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c35bc614 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:25.034884Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "891c3c29-caf4-4b4c-a794-6f81effe1aae"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-05-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:25.034884+00:00, try_number=1, job_id=602, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-31 00:00:00+00:00 +INFO - Started process 4958 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-05-31T00:00:00+00:00', '--job-id', '602', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpap7lp0n4'] +INFO - Job 602: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180531T000000, start_date=20221111T005125, end_date=20221111T005133 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:33.704955Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "891c3c29-caf4-4b4c-a794-6f81effe1aae"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..567efb0f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-05-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:25.013814Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-05-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "13377716-9c71-3ce8-a1ef-53b01570e5d4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d5c702af-08ee-47d0-a83b-8cabbd645476"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-05-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:25.013814+00:00, try_number=1, job_id=601, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-05-31 00:00:00+00:00 +INFO - Started process 4955 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-05-31T00:00:00+00:00', '--job-id', '601', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7m7pip1g'] +INFO - Job 601: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-05-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180531T000000, start_date=20221111T005125, end_date=20221111T005128 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-05-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:28.426856Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d5c702af-08ee-47d0-a83b-8cabbd645476"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..8efb35a9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:40.452212Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b2b27564-afa0-4cef-bbd6-e9120b28e973"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:40.452212+00:00, try_number=1, job_id=605, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-01 00:00:00+00:00 +INFO - Started process 4918 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-01T00:00:00+00:00', '--job-id', '605', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqp3f6fs7'] +INFO - Job 605: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180601T000000, start_date=20221111T005140, end_date=20221111T005144 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:44.463013Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b2b27564-afa0-4cef-bbd6-e9120b28e973"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2f807072 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:40.504198Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57e0901c-8ac4-44a0-aeb2-89048b6bb8ce"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:40.504198+00:00, try_number=1, job_id=606, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-01 00:00:00+00:00 +INFO - Started process 4920 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-01T00:00:00+00:00', '--job-id', '606', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfgzy7me_'] +INFO - Job 606: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180601T000000, start_date=20221111T005140, end_date=20221111T005143 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:43.286518Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57e0901c-8ac4-44a0-aeb2-89048b6bb8ce"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..01bc37f5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:53.753368Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "62d2e0c2-36a3-4633-a34d-91de88a4b717"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:53.753368+00:00, try_number=1, job_id=610, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-01 00:00:00+00:00 +INFO - Started process 4938 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-01T00:00:00+00:00', '--job-id', '610', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppor688y2'] +INFO - Job 610: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f2f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'raWYSanY493MuhO0yx4nBA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:raWYSanY493MuhO0yx4nBA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005154Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005154Z +20221111/us-east-1/s3/aws4_request +b0ca6894fa3f05ee1303d0b589196f1544297a556e4d730439dd4ac2d7e2c727 +INFO - '2022-11-11' - botocore.auth - Signature: +b1710d4aa36cc14466590ef388dd9e722c4d0c29d022b7aac36aa604bb298f02 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'wWDM2vdgC335V1ciSlsqQZAQgwNZmbsE/x1k82PsUhDkEKp3dL2ox8E4uCioiR7rlUogRcHSvm0=', 'x-amz-request-id': '07G6XW2NKTQ5JJH1', 'Date': 'Fri, 11 Nov 2022 00:51:55 GMT', 'ETag': '"ada59849a9d8e3ddccba13b4cb1e2704"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180601T000000, start_date=20221111T005153, end_date=20221111T005155 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:55.682318Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "62d2e0c2-36a3-4633-a34d-91de88a4b717"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9658a1a6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:50.097482Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73ad7cb4-c06b-4341-9ab9-e2df181e3f38"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:50.097482+00:00, try_number=1, job_id=609, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-01 00:00:00+00:00 +INFO - Started process 4930 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-01T00:00:00+00:00', '--job-id', '609', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoe6uahqu'] +INFO - Job 609: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005150Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005150Z +20221111/us-east-1/s3/aws4_request +e75c46e0a682a14156b1e69844fe63c5ea54c663789c44682bd238b9105df580 +INFO - '2022-11-11' - botocore.auth - Signature: +bf709ae927e38da56e4f99a8dc113120c41614a654bb3ba737f99dc358f04c3e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'ha6jV2iIBekYWm6NfLo9HhIOZV3mM8e4MHqtqRU4lbT6eXfeJkd4sBnkPMyEifc18xB7o2h1Y2c=', 'x-amz-request-id': 'WGMFEH3TB5WZDR2R', 'Date': 'Fri, 11 Nov 2022 00:51:51 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180601T000000, start_date=20221111T005150, end_date=20221111T005152 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:52.205864Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73ad7cb4-c06b-4341-9ab9-e2df181e3f38"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d4fbb381 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:46.149015Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17e65814-e436-420c-8814-1eaa2a149071"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:46.149015+00:00, try_number=1, job_id=608, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-01 00:00:00+00:00 +INFO - Started process 4926 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-01T00:00:00+00:00', '--job-id', '608', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprigmodv0'] +INFO - Job 608: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180601T000000, start_date=20221111T005146, end_date=20221111T005151 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:51.979488Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17e65814-e436-420c-8814-1eaa2a149071"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..35c7e955 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:51:45.553660Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7f8497de-e866-3c17-b406-a3f5bbe60b2c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "df206569-3c3c-4439-bf2a-7dae6743cdc5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:45.553660+00:00, try_number=1, job_id=607, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-01 00:00:00+00:00 +INFO - Started process 5029 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-01T00:00:00+00:00', '--job-id', '607', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp67a9ni__'] +INFO - Job 607: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180601T000000, start_date=20221111T005145, end_date=20221111T005148 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:51:48.141365Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "df206569-3c3c-4439-bf2a-7dae6743cdc5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..325a8380 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:57.799060Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "35f402fa-cc48-4e1d-869a-94018c0b855d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:57.799060+00:00, try_number=1, job_id=611, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-02 00:00:00+00:00 +INFO - Started process 4967 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-02T00:00:00+00:00', '--job-id', '611', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq5mq4tmo'] +INFO - Job 611: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180602T000000, start_date=20221111T005157, end_date=20221111T005200 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:00.963428Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "35f402fa-cc48-4e1d-869a-94018c0b855d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..556d2ae9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:51:57.933198Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "448f0e86-9d7b-453f-bfde-c031325b7855"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:51:57.933198+00:00, try_number=1, job_id=612, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-02 00:00:00+00:00 +INFO - Started process 4972 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-02T00:00:00+00:00', '--job-id', '612', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwlvax1ai'] +INFO - Job 612: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180602T000000, start_date=20221111T005157, end_date=20221111T005201 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:01.043474Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "448f0e86-9d7b-453f-bfde-c031325b7855"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..2899d55f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:10.376494Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f7a30769-18ab-4120-9fd6-1fd62ddbe937"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:10.376494+00:00, try_number=1, job_id=616, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-02 00:00:00+00:00 +INFO - Started process 5020 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-02T00:00:00+00:00', '--job-id', '616', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6njq9r2h'] +INFO - Job 616: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'raWYSanY493MuhO0yx4nBA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:raWYSanY493MuhO0yx4nBA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005211Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005211Z +20221111/us-east-1/s3/aws4_request +950921dd5e18b62143dd77c1a182f1acaf214b8d0fffd5a48074f0b22f9d6e6d +INFO - '2022-11-11' - botocore.auth - Signature: +3382f2841658ec80837605f82dd6849741e709f460a0823939a3c39ab6bb7aa1 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'rLSvX/Fy8wSEY8vRwvnLjB/mMYkXoOPVFywvs3KqunhiVQ0hGPGib+YOQDc/Y17AlhAnHLiiyLE=', 'x-amz-request-id': 'N9K60DTBPWNAK39P', 'Date': 'Fri, 11 Nov 2022 00:52:11 GMT', 'ETag': '"ada59849a9d8e3ddccba13b4cb1e2704"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180602T000000, start_date=20221111T005210, end_date=20221111T005212 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:12.346396Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f7a30769-18ab-4120-9fd6-1fd62ddbe937"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..cc138101 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:07.695152Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "21dbb012-03a6-4ee3-a8a9-0934b1c7b09f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:07.695152+00:00, try_number=1, job_id=615, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-02 00:00:00+00:00 +INFO - Started process 5043 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-02T00:00:00+00:00', '--job-id', '615', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_mdmjxmp'] +INFO - Job 615: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005208Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005208Z +20221111/us-east-1/s3/aws4_request +69071e1b5f1db60a11df54287f24b1183b5aabaacc76b41bed60dc000a39c711 +INFO - '2022-11-11' - botocore.auth - Signature: +1b7947fab784575dec4d8b48f1221a937895ccfcc2434c5ce07ce7cfa32d21b8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'uPL4N3QN2GlgspAU+ce5ZvCwuHfxospTIEG21iQROs4Cs0Tv54wkOpeBl2miAf4hUkUYFzsUgI4=', 'x-amz-request-id': 'FYN1DP97TD4Y1556', 'Date': 'Fri, 11 Nov 2022 00:52:08 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180602T000000, start_date=20221111T005207, end_date=20221111T005209 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:09.660097Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "21dbb012-03a6-4ee3-a8a9-0934b1c7b09f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..698f3161 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:02.789139Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0c85594f-09e3-4cba-8325-aa0cac4ed813"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:02.789139+00:00, try_number=1, job_id=613, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-02 00:00:00+00:00 +INFO - Started process 5036 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-02T00:00:00+00:00', '--job-id', '613', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6skn99qq'] +INFO - Job 613: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180602T000000, start_date=20221111T005202, end_date=20221111T005208 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:08.443471Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0c85594f-09e3-4cba-8325-aa0cac4ed813"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..4d7de997 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:02.804753Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "faf5ffe6-7fed-3574-ad2f-732f52355dfd"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17ef19e3-763d-453a-b505-2bb38920c5f8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:02.804753+00:00, try_number=1, job_id=614, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-02 00:00:00+00:00 +INFO - Started process 5038 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-02T00:00:00+00:00', '--job-id', '614', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp99c2qofe'] +INFO - Job 614: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180602T000000, start_date=20221111T005202, end_date=20221111T005205 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:05.733795Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17ef19e3-763d-453a-b505-2bb38920c5f8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..146bfa77 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:52:14.704381Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "40b550eb-6d6e-420d-ab3c-ce0c2ccb3d02"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:14.704381+00:00, try_number=1, job_id=618, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-03 00:00:00+00:00 +INFO - Started process 5088 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-03T00:00:00+00:00', '--job-id', '618', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfem9bidl'] +INFO - Job 618: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180603T000000, start_date=20221111T005214, end_date=20221111T005217 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:17.704040Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "40b550eb-6d6e-420d-ab3c-ce0c2ccb3d02"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d65c3d9a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:52:14.577857Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "24c2354f-5ad4-4805-b59f-f40bab99aa52"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:14.577857+00:00, try_number=1, job_id=617, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-03 00:00:00+00:00 +INFO - Started process 5085 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-03T00:00:00+00:00', '--job-id', '617', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_etpod4q'] +INFO - Job 617: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180603T000000, start_date=20221111T005214, end_date=20221111T005217 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:17.743930Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "24c2354f-5ad4-4805-b59f-f40bab99aa52"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..543ce986 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:26.328460Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b9e1a2b-0de5-4cc5-85b9-b3c493dd5e94"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:26.328460+00:00, try_number=1, job_id=622, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-03 00:00:00+00:00 +INFO - Started process 5043 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-03T00:00:00+00:00', '--job-id', '622', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprwuov_wr'] +INFO - Job 622: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '2omT8nzAoRhM+kNFW3NW+g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:2omT8nzAoRhM+kNFW3NW+g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005227Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005227Z +20221111/us-east-1/s3/aws4_request +a5a7206e5070189935e9c4518db36242169d6799d631274c028b23c9ee31c617 +INFO - '2022-11-11' - botocore.auth - Signature: +df541c023f61a3902d8ca5dfbb0340510e45b9cada8328fb087256bc65f1768e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'yl+Tizc1fSFANMUg+UO2VoWqwJlLb52I5SCONxlCpQZxaU34sqH2kHOLejYQ7hFCOVnDcCZ+v4w=', 'x-amz-request-id': 'M96ZH85KX75RPM5P', 'Date': 'Fri, 11 Nov 2022 00:52:27 GMT', 'ETag': '"da8993f27cc0a1184cfa43455b7356fa"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180603T000000, start_date=20221111T005226, end_date=20221111T005228 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:28.237452Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1b9e1a2b-0de5-4cc5-85b9-b3c493dd5e94"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a5f86ffd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:24.777159Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eccd2509-f3c6-43a5-9d30-e0c8cfb72444"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:24.777159+00:00, try_number=1, job_id=621, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-03 00:00:00+00:00 +INFO - Started process 5038 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-03T00:00:00+00:00', '--job-id', '621', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjn6g0pmo'] +INFO - Job 621: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005225Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005225Z +20221111/us-east-1/s3/aws4_request +ec02bf7e8693192b406fab8d0257822e8924b9094de29fde9b63a35e371b2ebd +INFO - '2022-11-11' - botocore.auth - Signature: +3729f13a43487e25c90736c6de24edb8426b67c996c6f10a92a96ae04db7116e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'VkyQvLnVlV1ZXuo6MmGtAVEgnUp2lC643vFEgKB957fmqda175AQmD0ejPDbwWEv0k85CGldVhY=', 'x-amz-request-id': 'AW56SXTMKQSKJW93', 'Date': 'Fri, 11 Nov 2022 00:52:26 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180603T000000, start_date=20221111T005224, end_date=20221111T005227 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:27.076019Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eccd2509-f3c6-43a5-9d30-e0c8cfb72444"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6744e9df --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:19.706292Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49aa0cb5-a583-40b4-b3eb-128c86370656"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:19.706292+00:00, try_number=1, job_id=619, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-03 00:00:00+00:00 +INFO - Started process 5029 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-03T00:00:00+00:00', '--job-id', '619', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwve7iy50'] +INFO - Job 619: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180603T000000, start_date=20221111T005219, end_date=20221111T005224 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:24.638880Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49aa0cb5-a583-40b4-b3eb-128c86370656"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..93cbf329 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:19.761583Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cdfd8af9-6ccd-3e82-a9b7-a2839fa1d4d8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "370f2ee0-28b9-4852-8662-850c6b8781ea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:19.761583+00:00, try_number=1, job_id=620, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-03 00:00:00+00:00 +INFO - Started process 5031 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-03T00:00:00+00:00', '--job-id', '620', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp76zpx141'] +INFO - Job 620: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180603T000000, start_date=20221111T005219, end_date=20221111T005222 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:22.902044Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "370f2ee0-28b9-4852-8662-850c6b8781ea"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..a22d6279 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:52:31.080878Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8df12858-718f-4a56-948c-d3497df4376f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:31.080878+00:00, try_number=1, job_id=623, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-04 00:00:00+00:00 +INFO - Started process 5094 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-04T00:00:00+00:00', '--job-id', '623', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnpmry83y'] +INFO - Job 623: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180604T000000, start_date=20221111T005231, end_date=20221111T005234 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:34.902504Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8df12858-718f-4a56-948c-d3497df4376f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..46f232ba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:52:31.093097Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4bb60a01-b7c4-4da0-90a5-74925f1d6d17"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:31.093097+00:00, try_number=1, job_id=624, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-04 00:00:00+00:00 +INFO - Started process 5096 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-04T00:00:00+00:00', '--job-id', '624', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzrtagnl9'] +INFO - Job 624: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180604T000000, start_date=20221111T005231, end_date=20221111T005234 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:34.943154Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4bb60a01-b7c4-4da0-90a5-74925f1d6d17"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f983f78e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:45.611587Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5da2dfde-3a93-4e35-a832-8288cf285fb5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:45.611587+00:00, try_number=1, job_id=628, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-04 00:00:00+00:00 +INFO - Started process 5173 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-04T00:00:00+00:00', '--job-id', '628', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpixx973pe'] +INFO - Job 628: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'khyiklmHdaa/J8G1VWGnYA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:khyiklmHdaa/J8G1VWGnYA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005247Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005247Z +20221111/us-east-1/s3/aws4_request +496486a0c5712580c855729ba60cfbcedd65e7e4b376e55a4aee19d54f3001f6 +INFO - '2022-11-11' - botocore.auth - Signature: +e7b581288a8a9b37067cc3ba6e3e710b1e0be733400e89d9437b0c34af00bf48 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 's9Jdl3AxcC8yg7KpBN5oWc7oESDLRj8D7ZjwnduVbSIXCJdtKbbKiP4hdun5DBYC5MrcCLaOnI4=', 'x-amz-request-id': 'HQJR21VVPYSWRBFX', 'Date': 'Fri, 11 Nov 2022 00:52:49 GMT', 'ETag': '"921ca292598775a6bf27c1b55561a760"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180604T000000, start_date=20221111T005245, end_date=20221111T005249 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:49.917037Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5da2dfde-3a93-4e35-a832-8288cf285fb5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..dc36b1c3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:41.965331Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d944914-7c9f-47a4-bf34-60514b50e495"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:41.965331+00:00, try_number=1, job_id=627, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-04 00:00:00+00:00 +INFO - Started process 5138 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-04T00:00:00+00:00', '--job-id', '627', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps3r6fod8'] +INFO - Job 627: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50073a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005243Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005243Z +20221111/us-east-1/s3/aws4_request +c968dff984f0d5119b72958e8200af17cd63e9f068a79d898a7ed11fea4313db +INFO - '2022-11-11' - botocore.auth - Signature: +d6a8c54a2bd979a8ea1cf1692378e1e574a9c384b17879b31d97dca234d4cedb +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'qYtnHjY+KwaBEOMQmXnRQPhnme0ksmYBO/BNisekqdoChf+xwSkruMvDuehQaINtgOuI49tAe2M=', 'x-amz-request-id': 'D0YQ8DM6KX4M8R1V', 'Date': 'Fri, 11 Nov 2022 00:52:44 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180604T000000, start_date=20221111T005241, end_date=20221111T005244 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:44.680696Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d944914-7c9f-47a4-bf34-60514b50e495"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..7d5ba568 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:37.036984Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb0909c7-016b-41a4-86be-6d084677a262"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:37.036984+00:00, try_number=1, job_id=626, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-04 00:00:00+00:00 +INFO - Started process 5130 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-04T00:00:00+00:00', '--job-id', '626', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa1y3okt6'] +INFO - Job 626: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180604T000000, start_date=20221111T005237, end_date=20221111T005243 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:43.770359Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb0909c7-016b-41a4-86be-6d084677a262"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..53bce694 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:37.019405Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1dde33c8-f41a-3912-87a3-78bbbf842c34"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c01f8c7d-b186-4532-9324-b51993c132ab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:37.019405+00:00, try_number=1, job_id=625, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-04 00:00:00+00:00 +INFO - Started process 5129 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-04T00:00:00+00:00', '--job-id', '625', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpns0viidu'] +INFO - Job 625: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180604T000000, start_date=20221111T005237, end_date=20221111T005239 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:39.977299Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c01f8c7d-b186-4532-9324-b51993c132ab"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..25bba977 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:52:52.278248Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "35a94a5a-c4c6-45d5-bc09-0e47c946bf2f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:52.278248+00:00, try_number=1, job_id=629, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-05 00:00:00+00:00 +INFO - Started process 5128 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-05T00:00:00+00:00', '--job-id', '629', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv1qwqsv_'] +INFO - Job 629: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180605T000000, start_date=20221111T005252, end_date=20221111T005255 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:55.039128Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "35a94a5a-c4c6-45d5-bc09-0e47c946bf2f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..3e15e5ed --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:52:52.285648Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "98d7d4c4-e6c9-4f6b-942d-ac4a66ce6989"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:52.285648+00:00, try_number=1, job_id=630, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-05 00:00:00+00:00 +INFO - Started process 5130 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-05T00:00:00+00:00', '--job-id', '630', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpb_m_ioj9'] +INFO - Job 630: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180605T000000, start_date=20221111T005252, end_date=20221111T005254 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:54.949930Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "98d7d4c4-e6c9-4f6b-942d-ac4a66ce6989"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..7290a255 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:05.235423Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2989c3cd-a3d2-4986-9730-55abd49b70e6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:05.235423+00:00, try_number=1, job_id=634, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-05 00:00:00+00:00 +INFO - Started process 5208 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-05T00:00:00+00:00', '--job-id', '634', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv8noyzq1'] +INFO - Job 634: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '2omT8nzAoRhM+kNFW3NW+g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:2omT8nzAoRhM+kNFW3NW+g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005306Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005306Z +20221111/us-east-1/s3/aws4_request +124c2f0c767a31c7613ed918614773e1d5f1898e42e2bac572c1e74578d8a257 +INFO - '2022-11-11' - botocore.auth - Signature: +939b6d0f1d385835e35d5312132b9d33bb8f759971926bfe8331a42abafae586 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'T/4rIjgFJvUfPjaJW2sACIWuOTMECFN0WGwiq6kvEWMFHz2WKI9bc8YoyUfpFXQ7XY0yjyz5Ytc=', 'x-amz-request-id': 'FP5848D2M5RQGN82', 'Date': 'Fri, 11 Nov 2022 00:53:06 GMT', 'ETag': '"da8993f27cc0a1184cfa43455b7356fa"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180605T000000, start_date=20221111T005305, end_date=20221111T005307 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:07.217758Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2989c3cd-a3d2-4986-9730-55abd49b70e6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5943be88 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:01.776301Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "59003cdc-4cad-4aee-8b80-3e9fb2062238"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:01.776301+00:00, try_number=1, job_id=633, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-05 00:00:00+00:00 +INFO - Started process 5171 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-05T00:00:00+00:00', '--job-id', '633', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3r5zk972'] +INFO - Job 633: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005302Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005302Z +20221111/us-east-1/s3/aws4_request +1969b78fb9d3e2ff31d155a96c4ee6ae8d999df2fc7065df35103636a2bade5c +INFO - '2022-11-11' - botocore.auth - Signature: +15e83de8d958f44943248c0d4480b783f4bc877e36266356acfed701932f0d07 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UrzXEKqSsxtAoj1bJcn/9nCHP7Hg6It7SQQd+hZw3R8x7HpCIurkGc3vW3+r5kAZ2AW+JiT+Wqs=', 'x-amz-request-id': 'WRSS6WEB7HWXF04K', 'Date': 'Fri, 11 Nov 2022 00:53:03 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180605T000000, start_date=20221111T005301, end_date=20221111T005303 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:03.992873Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "59003cdc-4cad-4aee-8b80-3e9fb2062238"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..779148fe --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:56.790269Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "936b7b17-cf3a-4e7d-b428-04484b7c327c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:56.790269+00:00, try_number=1, job_id=631, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-05 00:00:00+00:00 +INFO - Started process 5216 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-05T00:00:00+00:00', '--job-id', '631', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphiqwde0y'] +INFO - Job 631: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180605T000000, start_date=20221111T005256, end_date=20221111T005303 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:03.347976Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "936b7b17-cf3a-4e7d-b428-04484b7c327c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..396a5ebb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:52:56.794058Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0ba8b592-acf3-31f6-89a3-8d2b042a1243"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a8a17466-65cb-4300-b01a-a5dbcc44e663"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:52:56.794058+00:00, try_number=1, job_id=632, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-05 00:00:00+00:00 +INFO - Started process 5219 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-05T00:00:00+00:00', '--job-id', '632', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpghpz_c1j'] +INFO - Job 632: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180605T000000, start_date=20221111T005256, end_date=20221111T005259 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:52:59.535206Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a8a17466-65cb-4300-b01a-a5dbcc44e663"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..8a107e85 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:53:09.115236Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "06807a47-bafa-4913-a239-43ded5176040"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:09.115236+00:00, try_number=1, job_id=636, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-06 00:00:00+00:00 +INFO - Started process 5227 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-06T00:00:00+00:00', '--job-id', '636', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw_igxdoe'] +INFO - Job 636: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180606T000000, start_date=20221111T005309, end_date=20221111T005311 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:11.818829Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "06807a47-bafa-4913-a239-43ded5176040"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..f2d6c76f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:53:09.117352Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "91cba8b5-82d2-457d-8316-58c541dd97cf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:09.117352+00:00, try_number=1, job_id=635, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-06 00:00:00+00:00 +INFO - Started process 5229 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-06T00:00:00+00:00', '--job-id', '635', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphtwfmqfb'] +INFO - Job 635: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180606T000000, start_date=20221111T005309, end_date=20221111T005311 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:11.931537Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "91cba8b5-82d2-457d-8316-58c541dd97cf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..0ed8458b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:23.118326Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6dd3cfcd-aa6f-48ea-8310-4fe5e1da183f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:23.118326+00:00, try_number=1, job_id=640, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-06 00:00:00+00:00 +INFO - Started process 5300 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-06T00:00:00+00:00', '--job-id', '640', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6qwvbx6c'] +INFO - Job 640: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'qn388bYjzKUwVMdahvmS8g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:qn388bYjzKUwVMdahvmS8g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005323Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005323Z +20221111/us-east-1/s3/aws4_request +ef29a74c7f27a1386a18b177e026d83eb79d6875cc41e7ee8c0bd79d2c9f9fa8 +INFO - '2022-11-11' - botocore.auth - Signature: +4fd2932f03124107177d5f8931b62d7bf80cc1bffa68c3a0bbf5a1617e9163b5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'g8nMlbOOdwH4bPg+r7iKPhdW7XJDy/+JpcKFYhYNE+NmEuNSQiiDw2wfwDFPDQuBsFOQdKRPyg0=', 'x-amz-request-id': 'ABKTQM054AD2QYKC', 'Date': 'Fri, 11 Nov 2022 00:53:24 GMT', 'ETag': '"aa7dfcf1b623cca53054c75a86f992f2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180606T000000, start_date=20221111T005323, end_date=20221111T005325 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:25.000574Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6dd3cfcd-aa6f-48ea-8310-4fe5e1da183f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..e60fefc1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:19.314679Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e7f25e9-9125-4ccb-b6b0-73367de881e6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:19.314679+00:00, try_number=1, job_id=639, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-06 00:00:00+00:00 +INFO - Started process 5224 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-06T00:00:00+00:00', '--job-id', '639', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpajohazot'] +INFO - Job 639: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005320Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005320Z +20221111/us-east-1/s3/aws4_request +0e96fa09f4ef1296412b7a20bc5753d41b96f6620b9552cfa3398a725893e082 +INFO - '2022-11-11' - botocore.auth - Signature: +60e1924b435ed3f9c92d3db62b7c491d1d385213aff4bfcccba9b36f84af19b8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Z5ALiujnyj3tjc4IxU3rlUd5omIBq11kwtqDeTs8SDjhbVKbiB1NwaOi2mGkM/B4qCxBirdbdMk=', 'x-amz-request-id': 'VPAGT3YY4WFMT9QF', 'Date': 'Fri, 11 Nov 2022 00:53:21 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180606T000000, start_date=20221111T005319, end_date=20221111T005321 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:21.845592Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e7f25e9-9125-4ccb-b6b0-73367de881e6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..44ba73ea --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:14.813975Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dd80efdf-fb48-4ab8-aa85-7cc6993e1e90"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:14.813975+00:00, try_number=1, job_id=638, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-06 00:00:00+00:00 +INFO - Started process 5219 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-06T00:00:00+00:00', '--job-id', '638', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe4ukggmr'] +INFO - Job 638: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180606T000000, start_date=20221111T005314, end_date=20221111T005321 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:21.686260Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dd80efdf-fb48-4ab8-aa85-7cc6993e1e90"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..860ff841 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:14.757960Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "7b1ce2f5-81d0-3ab5-8e28-26937ce2c3f5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f1da7d79-e2b2-4476-ba97-14b51c5a9745"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:14.757960+00:00, try_number=1, job_id=637, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-06 00:00:00+00:00 +INFO - Started process 5216 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-06T00:00:00+00:00', '--job-id', '637', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp79z0jnqz'] +INFO - Job 637: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180606T000000, start_date=20221111T005314, end_date=20221111T005317 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:17.434558Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f1da7d79-e2b2-4476-ba97-14b51c5a9745"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..2b697730 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:53:27.186156Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6dc578c5-4a23-4552-9210-d424a8189525"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:27.186156+00:00, try_number=1, job_id=642, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-07 00:00:00+00:00 +INFO - Started process 5310 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-07T00:00:00+00:00', '--job-id', '642', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_7y4qnts'] +INFO - Job 642: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180607T000000, start_date=20221111T005327, end_date=20221111T005330 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:30.386811Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6dc578c5-4a23-4552-9210-d424a8189525"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..5cd7691f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:53:27.183996Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9b0c55a-7bb6-4038-b3bd-df1c52553aca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:27.183996+00:00, try_number=1, job_id=641, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-07 00:00:00+00:00 +INFO - Started process 5311 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-07T00:00:00+00:00', '--job-id', '641', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuklx3z8_'] +INFO - Job 641: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180607T000000, start_date=20221111T005327, end_date=20221111T005330 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:30.458724Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9b0c55a-7bb6-4038-b3bd-df1c52553aca"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f562a84a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:39.861521Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f1bc537d-d446-4e5b-9b15-5c56c2a39acd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:39.861521+00:00, try_number=1, job_id=646, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-07 00:00:00+00:00 +INFO - Started process 5314 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-07T00:00:00+00:00', '--job-id', '646', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0ctuwuo6'] +INFO - Job 646: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'SMmN1Vb224q+imJ7RT57VQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:SMmN1Vb224q+imJ7RT57VQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005340Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005340Z +20221111/us-east-1/s3/aws4_request +bd606c13804f97f18deada8c2fc83abc66a1d5b455c2d6f3f4b075fb6b38e513 +INFO - '2022-11-11' - botocore.auth - Signature: +3879dc5282f4345f97a69672913fa8b03cf0084438888bd4400101e97ef55a45 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6DqenF7SrDUpcS0MFnJveVzMqIN+Q5A3Cox0j8S2EyKfKzN0XMTU19aQ/56D0EV2WvhXUgrWZ6A=', 'x-amz-request-id': '0S4NMB15742SPD9B', 'Date': 'Fri, 11 Nov 2022 00:53:41 GMT', 'ETag': '"48c98dd556f6db8abe8a627b453e7b55"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180607T000000, start_date=20221111T005339, end_date=20221111T005341 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:41.710052Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f1bc537d-d446-4e5b-9b15-5c56c2a39acd"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..57e112c0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:37.494790Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5236d3c4-9e4e-45be-b350-78d4769eeccc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:37.494790+00:00, try_number=1, job_id=645, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-07 00:00:00+00:00 +INFO - Started process 5306 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-07T00:00:00+00:00', '--job-id', '645', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe8e77kr9'] +INFO - Job 645: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005338Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005338Z +20221111/us-east-1/s3/aws4_request +9f26a63c3caed99455db91c6b8edbc25de8e968483d3c132a87e212fd38b3bb1 +INFO - '2022-11-11' - botocore.auth - Signature: +65c3a3bb82452388b3cde0bb9e4b42de1e2a26c386e08674a7e84516bda4cdff +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'AaAc5yRDG4W6f5NxhS3bAsIPx31K7ru7eQaYVrFchNyNvpm0rCSa6KZAvAzpQFHBD9pGDUBTJ1c=', 'x-amz-request-id': 'D0CYV3ZDK8J0W45S', 'Date': 'Fri, 11 Nov 2022 00:53:38 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180607T000000, start_date=20221111T005337, end_date=20221111T005339 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:39.527899Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5236d3c4-9e4e-45be-b350-78d4769eeccc"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..f7479eb2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:32.251465Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f3e07d0-10ec-4b12-9784-40f55773aeef"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:32.251465+00:00, try_number=1, job_id=643, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-07 00:00:00+00:00 +INFO - Started process 5266 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-07T00:00:00+00:00', '--job-id', '643', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr52p7tnj'] +INFO - Job 643: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180607T000000, start_date=20221111T005332, end_date=20221111T005338 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:38.055860Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f3e07d0-10ec-4b12-9784-40f55773aeef"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e522f971 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:32.264425Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ecb2a6d6-2282-3fe7-9054-c7c8b7afc676"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc7e59fe-bea5-4606-9f13-29445e69cfeb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:32.264425+00:00, try_number=1, job_id=644, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-07 00:00:00+00:00 +INFO - Started process 5271 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-07T00:00:00+00:00', '--job-id', '644', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphhyh0ir3'] +INFO - Job 644: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180607T000000, start_date=20221111T005332, end_date=20221111T005335 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:35.061584Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc7e59fe-bea5-4606-9f13-29445e69cfeb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ad296449 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:53:43.976370Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "883c502f-7bb2-4404-96cc-9b331a5cfc83"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:43.976370+00:00, try_number=1, job_id=647, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-08 00:00:00+00:00 +INFO - Started process 5319 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-08T00:00:00+00:00', '--job-id', '647', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm6l310fd'] +INFO - Job 647: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180608T000000, start_date=20221111T005343, end_date=20221111T005346 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:46.896824Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "883c502f-7bb2-4404-96cc-9b331a5cfc83"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..0352201a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:53:44.034383Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "adc2856c-0953-4020-b742-ab936a41c54f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:44.034383+00:00, try_number=1, job_id=648, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-08 00:00:00+00:00 +INFO - Started process 5321 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-08T00:00:00+00:00', '--job-id', '648', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphiop70c5'] +INFO - Job 648: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180608T000000, start_date=20221111T005344, end_date=20221111T005346 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:46.991243Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "adc2856c-0953-4020-b742-ab936a41c54f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..366f11c2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:56.832056Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "feb2fd45-0d24-44ff-bc83-960ad635f3af"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:56.832056+00:00, try_number=1, job_id=652, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-08 00:00:00+00:00 +INFO - Started process 5331 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-08T00:00:00+00:00', '--job-id', '652', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdxbio3o9'] +INFO - Job 652: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'U9ndkRAgoZSP8Hvqg/efKg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:U9ndkRAgoZSP8Hvqg/efKg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005357Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005357Z +20221111/us-east-1/s3/aws4_request +c0760b0fd257cd483862907b93bb1e0a92cd8f8778395328bb80986c6facb5b9 +INFO - '2022-11-11' - botocore.auth - Signature: +fe61bbcb6824212eb427932ad3ab5dfc8a28f28985eb0cb677f69212e9e3503d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'fLpek79bDSsX3ezq77kgkKMYle2f2TPQgWpJOAa10g6FXgbYRpdQVU5PRZiu7y9JdnQ12dgUhQI=', 'x-amz-request-id': 'QWCS2NZGTGCS6AVZ', 'Date': 'Fri, 11 Nov 2022 00:53:58 GMT', 'ETag': '"53d9dd911020a1948ff07bea83f79f2a"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180608T000000, start_date=20221111T005356, end_date=20221111T005358 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:58.814338Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "feb2fd45-0d24-44ff-bc83-960ad635f3af"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9bf03ed6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:53.651141Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a67c6feb-8cf3-4973-9909-f4881e3b9d11"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:53.651141+00:00, try_number=1, job_id=651, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-08 00:00:00+00:00 +INFO - Started process 5392 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-08T00:00:00+00:00', '--job-id', '651', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3_yv64up'] +INFO - Job 651: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50041f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005354Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005354Z +20221111/us-east-1/s3/aws4_request +d25806e9f4a53b1f6a8dee09d6864cf02257cf4a4961b008c4ffdd068f66e7a5 +INFO - '2022-11-11' - botocore.auth - Signature: +57270a9cd4abc427d1be29ea9721bd4155299cf982659572a7844b022aacf724 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'EBQQ/piBjkPH4LSAQUQMhHxpeTuZ4qTwrqnT+7WptNBpG+vpn16D+qxNnjHnGlNLFzoXZUsRIqI=', 'x-amz-request-id': 'QR3SYPQHQAJGKKMY', 'Date': 'Fri, 11 Nov 2022 00:53:55 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180608T000000, start_date=20221111T005353, end_date=20221111T005355 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:55.611220Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a67c6feb-8cf3-4973-9909-f4881e3b9d11"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..661fa656 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:48.842041Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "abfa0a08-aff1-4ac0-be8b-1a36f22b4b3f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:48.842041+00:00, try_number=1, job_id=650, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-08 00:00:00+00:00 +INFO - Started process 5323 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-08T00:00:00+00:00', '--job-id', '650', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp_fgm55r'] +INFO - Job 650: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180608T000000, start_date=20221111T005348, end_date=20221111T005355 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:55.238431Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "abfa0a08-aff1-4ac0-be8b-1a36f22b4b3f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e4d3cbbf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:53:48.842327Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dbfc6e21-4a17-39c3-8eeb-078752dffa8a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c727486b-cb0c-46c2-99c6-d108ab834a0a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:53:48.842327+00:00, try_number=1, job_id=649, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-08 00:00:00+00:00 +INFO - Started process 5325 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-08T00:00:00+00:00', '--job-id', '649', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxmbzaec8'] +INFO - Job 649: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180608T000000, start_date=20221111T005348, end_date=20221111T005351 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:53:51.647233Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c727486b-cb0c-46c2-99c6-d108ab834a0a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..a129ab82 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:02.053227Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb9a9c1e-0395-4416-b207-147dfed79837"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:02.053227+00:00, try_number=1, job_id=653, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-09 00:00:00+00:00 +INFO - Started process 5365 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-09T00:00:00+00:00', '--job-id', '653', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmg65yb03'] +INFO - Job 653: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180609T000000, start_date=20221111T005402, end_date=20221111T005405 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:05.014593Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb9a9c1e-0395-4416-b207-147dfed79837"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..9c576956 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:02.057372Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e626ed2a-f856-47b9-a642-af25f4e5f3be"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:02.057372+00:00, try_number=1, job_id=654, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-09 00:00:00+00:00 +INFO - Started process 5364 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-09T00:00:00+00:00', '--job-id', '654', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcezu8mus'] +INFO - Job 654: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180609T000000, start_date=20221111T005402, end_date=20221111T005405 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:05.024834Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e626ed2a-f856-47b9-a642-af25f4e5f3be"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..b66d088e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:14.732403Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee868bba-86b7-4a3c-a7d1-393e3c55617a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:14.732403+00:00, try_number=1, job_id=658, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-09 00:00:00+00:00 +INFO - Started process 5420 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-09T00:00:00+00:00', '--job-id', '658', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfekjuoli'] +INFO - Job 658: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'U9ndkRAgoZSP8Hvqg/efKg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:U9ndkRAgoZSP8Hvqg/efKg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005415Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005415Z +20221111/us-east-1/s3/aws4_request +9126a12a8525b405ef672eb779615631c5392c0305d9eb608275994db0c85155 +INFO - '2022-11-11' - botocore.auth - Signature: +b754b207591e65c663794a0a4d784de8603995912a8b61ddeb5feba47b6e189b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UXknLKyuJ0qFeQ/szSNvX8AQbYb2QIPKYwiF7kf1zm9++EJ+fKxNrWtzNwGlvqGlpdQtZd1jk8M=', 'x-amz-request-id': 'V5NB50FZCWXG7PZY', 'Date': 'Fri, 11 Nov 2022 00:54:16 GMT', 'ETag': '"53d9dd911020a1948ff07bea83f79f2a"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180609T000000, start_date=20221111T005414, end_date=20221111T005416 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:16.619274Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee868bba-86b7-4a3c-a7d1-393e3c55617a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..e4c2369d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:11.762592Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "064792ba-c710-47c8-9aba-9ec22da4e318"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:11.762592+00:00, try_number=1, job_id=657, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-09 00:00:00+00:00 +INFO - Started process 5413 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-09T00:00:00+00:00', '--job-id', '657', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8_mt0xii'] +INFO - Job 657: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005412Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005412Z +20221111/us-east-1/s3/aws4_request +02ab2e53ec7ed1756cd6e4ea0a3826c2937420b62acf7691ea32857df115949b +INFO - '2022-11-11' - botocore.auth - Signature: +e3528ed78cd54e08f7b570de2b4c4e4ba131d631246c96e841f34825a34537a0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'OElTJZytMkj8rXCogtXqa5XLFHw4Me9z4tu8WxS7u6LsVt79K39p6RgpnzTBLA/9v+FC3c7tifs=', 'x-amz-request-id': 'YC469EM27Q3C10CW', 'Date': 'Fri, 11 Nov 2022 00:54:13 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180609T000000, start_date=20221111T005411, end_date=20221111T005413 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:13.677775Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "064792ba-c710-47c8-9aba-9ec22da4e318"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..73f68eac --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:07.237850Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8c8f9140-d4dd-4d84-87c5-bfc931114849"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:07.237850+00:00, try_number=1, job_id=655, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-09 00:00:00+00:00 +INFO - Started process 5403 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-09T00:00:00+00:00', '--job-id', '655', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpruum6v33'] +INFO - Job 655: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180609T000000, start_date=20221111T005407, end_date=20221111T005412 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:12.788790Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8c8f9140-d4dd-4d84-87c5-bfc931114849"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f093c860 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:07.221542Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "83ecd6f1-a79a-30b7-867c-6278258bb374"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d1ace67-5067-407f-abdd-6adefc52fe8f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:07.221542+00:00, try_number=1, job_id=656, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-09 00:00:00+00:00 +INFO - Started process 5401 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-09T00:00:00+00:00', '--job-id', '656', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_dnudd2m'] +INFO - Job 656: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180609T000000, start_date=20221111T005407, end_date=20221111T005409 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:09.914382Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d1ace67-5067-407f-abdd-6adefc52fe8f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..79fa8576 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:19.006067Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ff0dae12-30c1-4690-9d56-574b45dffcc4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:19.006067+00:00, try_number=1, job_id=660, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-10 00:00:00+00:00 +INFO - Started process 5431 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-10T00:00:00+00:00', '--job-id', '660', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpleybm3bu'] +INFO - Job 660: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180610T000000, start_date=20221111T005419, end_date=20221111T005421 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:21.629619Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ff0dae12-30c1-4690-9d56-574b45dffcc4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7c4de0d0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:18.905169Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9a759ba-9400-48b5-9a68-e8f49f03ad02"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:18.905169+00:00, try_number=1, job_id=659, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-10 00:00:00+00:00 +INFO - Started process 5429 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-10T00:00:00+00:00', '--job-id', '659', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcfoj_hfd'] +INFO - Job 659: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180610T000000, start_date=20221111T005418, end_date=20221111T005421 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:21.663024Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9a759ba-9400-48b5-9a68-e8f49f03ad02"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..51da3fce --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:30.765683Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99ab5b59-c6c0-4549-b939-7fedf2558f7e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:30.765683+00:00, try_number=1, job_id=664, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-10 00:00:00+00:00 +INFO - Started process 5491 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-10T00:00:00+00:00', '--job-id', '664', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq1g4g7i6'] +INFO - Job 664: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Sp06VBprK2RVd4ltBET6Ew==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Sp06VBprK2RVd4ltBET6Ew== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005431Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005431Z +20221111/us-east-1/s3/aws4_request +86678abb5776077625b10bdac177ce27cf6cb5933130805189686e7096639ea2 +INFO - '2022-11-11' - botocore.auth - Signature: +b2c83c05a2434e452339c67bcf172ac68350e9bb3ef45d0902e2a37998650e09 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'hA8JISHEimiuEI4KcJz+WfNPeTq/BsNRaMejV2kmVJKPCAxHQMemY+OIM3/tMe7lByyrer4hQL0=', 'x-amz-request-id': 'BV05965ZGZT5V4K7', 'Date': 'Fri, 11 Nov 2022 00:54:32 GMT', 'ETag': '"4a9d3a541a6b2b645577896d0444fa13"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180610T000000, start_date=20221111T005430, end_date=20221111T005432 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:32.901112Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99ab5b59-c6c0-4549-b939-7fedf2558f7e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..91ec0aaa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:28.260942Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b179f42-80e3-4ee2-8f58-033489401ada"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:28.260942+00:00, try_number=1, job_id=663, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-10 00:00:00+00:00 +INFO - Started process 5483 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-10T00:00:00+00:00', '--job-id', '663', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsvbf0_j1'] +INFO - Job 663: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50041f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005429Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005429Z +20221111/us-east-1/s3/aws4_request +4fc59fe6d444b8a6d0ac90244b96309ad79998e0a5c74e99632a5ef8dd8dafa9 +INFO - '2022-11-11' - botocore.auth - Signature: +37aca17491c3047f6d49afd9621cd691af3f7f484d96b5a688bc22ad92a59102 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'A8EatHyrJtYtNaQzUHCmCI8s/HGXUMgJcInB5TxEd7bjzIA8RORvV5SyBvsNMdyp7GmpPF+oidM=', 'x-amz-request-id': 'WPH02J9ET1C456GA', 'Date': 'Fri, 11 Nov 2022 00:54:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180610T000000, start_date=20221111T005428, end_date=20221111T005430 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:30.286591Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b179f42-80e3-4ee2-8f58-033489401ada"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..40583b41 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:23.467360Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8397ef5e-d5b9-4167-be60-5ec3021d9b84"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:23.467360+00:00, try_number=1, job_id=661, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-10 00:00:00+00:00 +INFO - Started process 5473 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-10T00:00:00+00:00', '--job-id', '661', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzuemsadr'] +INFO - Job 661: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180610T000000, start_date=20221111T005423, end_date=20221111T005429 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:29.113580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8397ef5e-d5b9-4167-be60-5ec3021d9b84"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e3f185d7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:23.531390Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c743b4d3-a528-3d6e-b135-82bd39e0ac9c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "80b696cd-479f-44bd-8275-340680713559"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:23.531390+00:00, try_number=1, job_id=662, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-10 00:00:00+00:00 +INFO - Started process 5476 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-10T00:00:00+00:00', '--job-id', '662', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi3d5cq09'] +INFO - Job 662: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180610T000000, start_date=20221111T005423, end_date=20221111T005426 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:26.682491Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "80b696cd-479f-44bd-8275-340680713559"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ca572e67 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:35.168170Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2928fa78-51b3-4af9-857a-13c89856bdca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:35.168170+00:00, try_number=1, job_id=665, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-11 00:00:00+00:00 +INFO - Started process 5499 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-11T00:00:00+00:00', '--job-id', '665', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5iiu37gf'] +INFO - Job 665: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180611T000000, start_date=20221111T005435, end_date=20221111T005438 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:38.143256Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2928fa78-51b3-4af9-857a-13c89856bdca"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..cbfbdd0c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:35.179769Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dec2a20f-5af7-4f53-b084-307f6802aead"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:35.179769+00:00, try_number=1, job_id=666, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-11 00:00:00+00:00 +INFO - Started process 5502 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-11T00:00:00+00:00', '--job-id', '666', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgvujru2t'] +INFO - Job 666: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180611T000000, start_date=20221111T005435, end_date=20221111T005438 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:38.142010Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dec2a20f-5af7-4f53-b084-307f6802aead"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f465352e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:47.523820Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99b4f732-6dc9-4966-9fe4-c104314fadab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:47.523820+00:00, try_number=1, job_id=670, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-11 00:00:00+00:00 +INFO - Started process 5538 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-11T00:00:00+00:00', '--job-id', '670', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpachby7v6'] +INFO - Job 670: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'IwNo4wg+42dGKwX2/U0PEA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:IwNo4wg+42dGKwX2/U0PEA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005448Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005448Z +20221111/us-east-1/s3/aws4_request +403a324c7113acb45e3064ec292af3717de282b24b25334c87c8f3fb44265302 +INFO - '2022-11-11' - botocore.auth - Signature: +17d27e3e02025829627f9fc664cbf3a588bfae1dfc2132c87ad6e83037e7d2c5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '59De+GDud2a+SKABoPKYNy/aNkQ3hRuEauzoNVcgaP8xMGW25xzNbPUTZHXw+FP5BwlxCq9YdKA=', 'x-amz-request-id': 'ET9EA8MT3PB9BEZW', 'Date': 'Fri, 11 Nov 2022 00:54:48 GMT', 'ETag': '"230368e3083ee367462b05f6fd4d0f10"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180611T000000, start_date=20221111T005447, end_date=20221111T005449 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:49.247761Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99b4f732-6dc9-4966-9fe4-c104314fadab"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9eb855d0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:44.427054Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e2747b6-579b-4d33-b199-e0fb50a6e8d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:44.427054+00:00, try_number=1, job_id=669, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-11 00:00:00+00:00 +INFO - Started process 5502 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-11T00:00:00+00:00', '--job-id', '669', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp70ykefq4'] +INFO - Job 669: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499553a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005445Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005445Z +20221111/us-east-1/s3/aws4_request +43ea58260d3d95f8c7da6f4f467a7def6c6c36bacaa7bec503402bfc91974343 +INFO - '2022-11-11' - botocore.auth - Signature: +f1cd4e9a27b71090c7879aca5fe974607e7ee94cd2869def6dabb8c2551ff4d4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'd8ayAi8Mn5dECrVXgEimweGwTpyMTMPQzikkpCUHiko8ICoVXytMOyfBTFgS6uXVCstEP9G45+4=', 'x-amz-request-id': 'S4NDC0FSD2CR40G2', 'Date': 'Fri, 11 Nov 2022 00:54:45 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180611T000000, start_date=20221111T005444, end_date=20221111T005446 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:46.565377Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e2747b6-579b-4d33-b199-e0fb50a6e8d6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8ec81f98 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:39.578156Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "faef7dce-c2a5-46ff-a626-c4c820c7ee3e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:39.578156+00:00, try_number=1, job_id=667, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-11 00:00:00+00:00 +INFO - Started process 5510 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-11T00:00:00+00:00', '--job-id', '667', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6672dsed'] +INFO - Job 667: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180611T000000, start_date=20221111T005439, end_date=20221111T005445 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:45.352267Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "faef7dce-c2a5-46ff-a626-c4c820c7ee3e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..8ccf36e2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:39.653477Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fce25c89-86aa-3432-9ddb-5dd658e6fc18"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "76e1235a-812b-4d4f-942e-c59c7fa1237f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:39.653477+00:00, try_number=1, job_id=668, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-11 00:00:00+00:00 +INFO - Started process 5512 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-11T00:00:00+00:00', '--job-id', '668', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpk5y6yvhf'] +INFO - Job 668: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180611T000000, start_date=20221111T005439, end_date=20221111T005442 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:42.602865Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "76e1235a-812b-4d4f-942e-c59c7fa1237f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..24aef303 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:51.544451Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "13e7cf36-de8d-49b2-a3f3-6a68e2331389"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:51.544451+00:00, try_number=1, job_id=672, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-12 00:00:00+00:00 +INFO - Started process 5576 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-12T00:00:00+00:00', '--job-id', '672', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprskx1pwc'] +INFO - Job 672: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180612T000000, start_date=20221111T005451, end_date=20221111T005454 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:54.711723Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "13e7cf36-de8d-49b2-a3f3-6a68e2331389"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2537928f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:54:51.544372Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c4c25450-aad5-4a57-8e74-b0b4de5f334d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:51.544372+00:00, try_number=1, job_id=671, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-12 00:00:00+00:00 +INFO - Started process 5577 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-12T00:00:00+00:00', '--job-id', '671', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6m12bgqw'] +INFO - Job 671: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180612T000000, start_date=20221111T005451, end_date=20221111T005454 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:54:54.538303Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c4c25450-aad5-4a57-8e74-b0b4de5f334d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d3b2c1be --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:12.219392Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a39daf6d-6492-4e5e-9008-7ef78435c258"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:12.219392+00:00, try_number=1, job_id=676, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-12 00:00:00+00:00 +INFO - Started process 5576 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-12T00:00:00+00:00', '--job-id', '676', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkvxrxlhx'] +INFO - Job 676: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'U9ndkRAgoZSP8Hvqg/efKg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:U9ndkRAgoZSP8Hvqg/efKg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005513Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005513Z +20221111/us-east-1/s3/aws4_request +950aac4c094b7c55997dfee756d67114d809c29d9179b81f72eeedaf61810e83 +INFO - '2022-11-11' - botocore.auth - Signature: +aae48eb1dc4be7315bc8fa50bc19b6990e81e3b2cc73487a0a553e65940cdf8b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 't47arG9lG0E4SBgjmxTBNKnYr4rYoifePoRc9Z+gs9XsEwv3QAsT53WMXnVDrJoPATE1rFKSFP4=', 'x-amz-request-id': 'C47929X6SQED7M8X', 'Date': 'Fri, 11 Nov 2022 00:55:13 GMT', 'ETag': '"53d9dd911020a1948ff07bea83f79f2a"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180612T000000, start_date=20221111T005512, end_date=20221111T005514 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:14.494019Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a39daf6d-6492-4e5e-9008-7ef78435c258"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c8730af6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:02.257912Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "953ad248-cd50-484e-a038-8216bdd448ae"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:02.257912+00:00, try_number=1, job_id=675, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-12 00:00:00+00:00 +INFO - Started process 5523 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-12T00:00:00+00:00', '--job-id', '675', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp04sprcvf'] +INFO - Job 675: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005503Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005503Z +20221111/us-east-1/s3/aws4_request +5c4d43e05c0d523886691bd8c23568e5f582af2eab14e2298ee46bf07d8d48f3 +INFO - '2022-11-11' - botocore.auth - Signature: +334a9d2622810be3a2a4f2b8e56204304fc1252868ea4a512041932a37712768 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 't/28mmNbdbTt1BdsPBmiuSEYlbXKkfynsD3XTJjCavCvxcEORCwbpuEKz03zZZ0rOd5ptlaxtSg=', 'x-amz-request-id': 'CFWDJ88PMKBQ8V6Q', 'Date': 'Fri, 11 Nov 2022 00:55:03 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180612T000000, start_date=20221111T005502, end_date=20221111T005504 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:04.696120Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "953ad248-cd50-484e-a038-8216bdd448ae"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c9b21034 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:56.951880Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57878409-dae2-484e-9b35-0ae695ad83c2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:56.951880+00:00, try_number=1, job_id=674, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-12 00:00:00+00:00 +INFO - Started process 5599 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-12T00:00:00+00:00', '--job-id', '674', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnffe30pj'] +INFO - Job 674: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180612T000000, start_date=20221111T005456, end_date=20221111T005509 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:09.302331Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57878409-dae2-484e-9b35-0ae695ad83c2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6cce9e56 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:54:56.955310Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cd0539ba-fb88-38a1-b002-b1d8351210c0"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d698cb0-0521-46da-9b4a-e6aa6f5b76e9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:54:56.955310+00:00, try_number=1, job_id=673, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-12 00:00:00+00:00 +INFO - Started process 5596 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-12T00:00:00+00:00', '--job-id', '673', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp52zoxlwq'] +INFO - Job 673: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180612T000000, start_date=20221111T005456, end_date=20221111T005500 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:00.264448Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d698cb0-0521-46da-9b4a-e6aa6f5b76e9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c9e928c5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:55:18.283521Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8da5fbe-84f7-4502-b413-0c2de41c7b16"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:18.283521+00:00, try_number=1, job_id=677, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-13 00:00:00+00:00 +INFO - Started process 5606 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-13T00:00:00+00:00', '--job-id', '677', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp0e_fy1t'] +INFO - Job 677: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180613T000000, start_date=20221111T005518, end_date=20221111T005523 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:23.289990Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8da5fbe-84f7-4502-b413-0c2de41c7b16"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d2b1c744 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:55:18.435197Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eabe94c2-5c67-4034-a316-f8c6a37e07d8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:18.435197+00:00, try_number=1, job_id=678, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-13 00:00:00+00:00 +INFO - Started process 5609 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-13T00:00:00+00:00', '--job-id', '678', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3695_xs0'] +INFO - Job 678: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180613T000000, start_date=20221111T005518, end_date=20221111T005523 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:23.431168Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eabe94c2-5c67-4034-a316-f8c6a37e07d8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e417a15d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:39.181506Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f7c6bc5-20db-4d6d-96a6-67198809b9d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:39.181506+00:00, try_number=1, job_id=682, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-13 00:00:00+00:00 +INFO - Started process 5593 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-13T00:00:00+00:00', '--job-id', '682', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgky86bgf'] +INFO - Job 682: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'rXySpXarDeZJAid0NpB6WQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:rXySpXarDeZJAid0NpB6WQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005540Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005540Z +20221111/us-east-1/s3/aws4_request +bee903ddfa123e673d65632a3ea9b4ddba3b4b3a119b0831459137d59576326e +INFO - '2022-11-11' - botocore.auth - Signature: +8f316b08a829ab7bf7e903003377f5f1e3e7be0076dd57aa816dd9b522f4a88c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mCNfp2YlDJv9OzO4iaR6fskrUYVWr4igpM1F73gubCe3OjYwWOsxpE3X8dt6koHmskEcU6rpoUY=', 'x-amz-request-id': 'RE4KMMBYNM3RD65P', 'Date': 'Fri, 11 Nov 2022 00:55:40 GMT', 'ETag': '"ad7c92a576ab0de64902277436907a59"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180613T000000, start_date=20221111T005539, end_date=20221111T005541 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:41.459033Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f7c6bc5-20db-4d6d-96a6-67198809b9d6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4a7c5ed0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:32.563910Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9eb9976a-841f-4250-a2d1-dfc5f18d568b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:32.563910+00:00, try_number=1, job_id=681, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-13 00:00:00+00:00 +INFO - Started process 5615 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-13T00:00:00+00:00', '--job-id', '681', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps0a1z_ma'] +INFO - Job 681: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50063a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005534Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005534Z +20221111/us-east-1/s3/aws4_request +a06d54368b3a85dcfe7360e42f2c6fcaa35c7ec2ff10ba984ca51e7976c601c6 +INFO - '2022-11-11' - botocore.auth - Signature: +018b51adf2f30326d6a011c8c8882220fd3bee0cc292f4a66271524abb4c32e6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'TT7Lx2u9LcZYB5j5fi0BR0l0yVNd7eGki6KAJ7vB4HVYiizDr2yS3MG2aKtDiDsTPDyXhUstaNI=', 'x-amz-request-id': 'TZ3FMEGMF8D7Z3F9', 'Date': 'Fri, 11 Nov 2022 00:55:34 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180613T000000, start_date=20221111T005532, end_date=20221111T005535 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:35.341932Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9eb9976a-841f-4250-a2d1-dfc5f18d568b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..eef5337d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:26.157164Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "538f1e34-ba7a-4bc0-a6c0-b2e4a5ddf168"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:26.157164+00:00, try_number=1, job_id=680, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-13 00:00:00+00:00 +INFO - Started process 5587 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-13T00:00:00+00:00', '--job-id', '680', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphmav4let'] +INFO - Job 680: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180613T000000, start_date=20221111T005526, end_date=20221111T005536 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:36.986193Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "538f1e34-ba7a-4bc0-a6c0-b2e4a5ddf168"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..d81ad702 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:26.002695Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "def3c91a-4c8f-36ff-8697-fbe7a94fc3ad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aa3254e7-8d72-4818-989a-4d3d5a6fb574"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:26.002695+00:00, try_number=1, job_id=679, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-13 00:00:00+00:00 +INFO - Started process 5585 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-13T00:00:00+00:00', '--job-id', '679', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwfndf1pk'] +INFO - Job 679: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180613T000000, start_date=20221111T005526, end_date=20221111T005530 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:30.075643Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aa3254e7-8d72-4818-989a-4d3d5a6fb574"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d0a349e8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:55:45.304196Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d843a1a4-e935-49b1-a1c3-f920e7303ea8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:45.304196+00:00, try_number=1, job_id=683, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-14 00:00:00+00:00 +INFO - Started process 5601 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-14T00:00:00+00:00', '--job-id', '683', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdf0jls7c'] +INFO - Job 683: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180614T000000, start_date=20221111T005545, end_date=20221111T005548 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:48.348762Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d843a1a4-e935-49b1-a1c3-f920e7303ea8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..4e9dee46 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:55:45.906462Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4a1f8d27-c31a-4d4b-b468-da74fe5c7f99"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:45.906462+00:00, try_number=1, job_id=684, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-14 00:00:00+00:00 +INFO - Started process 5604 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-14T00:00:00+00:00', '--job-id', '684', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp37rtx19_'] +INFO - Job 684: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180614T000000, start_date=20221111T005545, end_date=20221111T005548 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:48.765591Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4a1f8d27-c31a-4d4b-b468-da74fe5c7f99"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..30095cc4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:58.205843Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9920a8e7-d6db-43e3-a9f9-b1a604cc2c29"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:58.205843+00:00, try_number=1, job_id=688, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-14 00:00:00+00:00 +INFO - Started process 5675 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-14T00:00:00+00:00', '--job-id', '688', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn_667vkn'] +INFO - Job 688: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'rXySpXarDeZJAid0NpB6WQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:rXySpXarDeZJAid0NpB6WQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005558Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005558Z +20221111/us-east-1/s3/aws4_request +24a9190d2e3324f04688112c1037ba7b0bbb4e1a331a87623dca4a351e2aa662 +INFO - '2022-11-11' - botocore.auth - Signature: +280ac4ed7cccffbadd6afe7a3948ff2e9ab06d321be31d5c62c33fee383144c4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'IPWEd+fRNdeBwZ16RsuYoXLL5GBuKV0/qOUdSn97r0/wUPjPkT6KOu3LEKwopq3kXxJ40sCOcfU=', 'x-amz-request-id': '4DC44K9FN2F3RZ51', 'Date': 'Fri, 11 Nov 2022 00:55:59 GMT', 'ETag': '"ad7c92a576ab0de64902277436907a59"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180614T000000, start_date=20221111T005558, end_date=20221111T005559 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:59.898951Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9920a8e7-d6db-43e3-a9f9-b1a604cc2c29"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5c18f48d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:55.642165Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd0fd2b5-5edc-4190-861f-c1b5eb2697f3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:55.642165+00:00, try_number=1, job_id=687, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-14 00:00:00+00:00 +INFO - Started process 5691 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-14T00:00:00+00:00', '--job-id', '687', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptt7tuard'] +INFO - Job 687: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005556Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005556Z +20221111/us-east-1/s3/aws4_request +1f2fc8152455473ae88484280ae70250cc183d87f975d860eca92391ca64ee86 +INFO - '2022-11-11' - botocore.auth - Signature: +9e75a2a8eda16b85364580066c96033999ddb82a2bc8b48b041ca1119540ef06 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '425WiUBOcJkdfsrM1FYkiwTAJ7vIJESjN4M2FAj9RaeF0aJZKa2neNA+5yZbuJ8aqg50ErRJnwfeFIeCyRrzwQ==', 'x-amz-request-id': 'RCV4CM7H95J2KP43', 'Date': 'Fri, 11 Nov 2022 00:55:57 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180614T000000, start_date=20221111T005555, end_date=20221111T005557 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:57.635711Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd0fd2b5-5edc-4190-861f-c1b5eb2697f3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..153381bf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:51.090198Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0857933d-44e2-4871-8104-ac20318b017b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:51.090198+00:00, try_number=1, job_id=686, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-14 00:00:00+00:00 +INFO - Started process 5686 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-14T00:00:00+00:00', '--job-id', '686', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpngznrtqy'] +INFO - Job 686: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180614T000000, start_date=20221111T005551, end_date=20221111T005556 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:56.522106Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0857933d-44e2-4871-8104-ac20318b017b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6b2a9a4a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:55:51.070151Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "baa4455a-8415-3df5-a6be-803e4c6cae60"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cbf187b9-aba4-48a0-ba92-a44f135d0e5b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:55:51.070151+00:00, try_number=1, job_id=685, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-14 00:00:00+00:00 +INFO - Started process 5685 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-14T00:00:00+00:00', '--job-id', '685', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcnv3j2wa'] +INFO - Job 685: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180614T000000, start_date=20221111T005551, end_date=20221111T005553 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:55:53.952688Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cbf187b9-aba4-48a0-ba92-a44f135d0e5b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..3c4da89b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:02.381820Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f819a5d-2064-4cc5-a5af-7c25925bb079"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:02.381820+00:00, try_number=1, job_id=690, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-15 00:00:00+00:00 +INFO - Started process 5703 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-15T00:00:00+00:00', '--job-id', '690', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptlgvgtb8'] +INFO - Job 690: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180615T000000, start_date=20221111T005602, end_date=20221111T005605 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:05.265654Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f819a5d-2064-4cc5-a5af-7c25925bb079"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c9d7e01b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:02.371013Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "436d7f8b-dbfd-4522-9583-6d333aec5553"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:02.371013+00:00, try_number=1, job_id=689, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-15 00:00:00+00:00 +INFO - Started process 5701 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-15T00:00:00+00:00', '--job-id', '689', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpipudlwwq'] +INFO - Job 689: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180615T000000, start_date=20221111T005602, end_date=20221111T005605 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:05.288928Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "436d7f8b-dbfd-4522-9583-6d333aec5553"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..7679d880 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:15.180342Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b9f39dc9-c819-40fe-a5ce-96f00d8f1866"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:15.180342+00:00, try_number=1, job_id=694, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-15 00:00:00+00:00 +INFO - Started process 5774 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-15T00:00:00+00:00', '--job-id', '694', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp413359kg'] +INFO - Job 694: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JBGWtitYC76rVkAE1NCBWw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:JBGWtitYC76rVkAE1NCBWw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005615Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005615Z +20221111/us-east-1/s3/aws4_request +aa4d2888f9e6c7d9fbb375045bef3e88aed380730b7d31d7d8376647d5f4d55a +INFO - '2022-11-11' - botocore.auth - Signature: +2b72e0b0ad77a1b79a96115b6559f3c4ec4008512e2522b7db48c83fca6bb454 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'uwTcitdgF57p6zHuYFW/MbkUjnvurhlvcA+reYP+ffv4VsMm6ppmMPtUjzyAlxR+lEgpC9k1QUg=', 'x-amz-request-id': 'TAP37P87AFQHETDT', 'Date': 'Fri, 11 Nov 2022 00:56:16 GMT', 'ETag': '"241196b62b580bbeab564004d4d0815b"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180615T000000, start_date=20221111T005615, end_date=20221111T005616 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:16.891227Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b9f39dc9-c819-40fe-a5ce-96f00d8f1866"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..35c8dd4c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:12.892072Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bcaebf4-ed5c-4c42-bfd4-0523b3e59c22"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:12.892072+00:00, try_number=1, job_id=693, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-15 00:00:00+00:00 +INFO - Started process 5692 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-15T00:00:00+00:00', '--job-id', '693', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxfzk4kk6'] +INFO - Job 693: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005613Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005613Z +20221111/us-east-1/s3/aws4_request +9350135a509e1bc0b367e22d5e05b6013cfd1d8ef60695456a16e2b30dde3129 +INFO - '2022-11-11' - botocore.auth - Signature: +c544eac7945a4ede068ca9de35dce97aee31b47fac3314c4cd1f1795dfe38d42 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'tMj6PQFiX6j8pRBrdSI6QFVUUNeLCxa1gu89ieD1GiBjojTCw0BajRSIn58JbYOcg1JIihVRiHA=', 'x-amz-request-id': 'P1V71DG5427K3X47', 'Date': 'Fri, 11 Nov 2022 00:56:14 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180615T000000, start_date=20221111T005612, end_date=20221111T005614 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:14.603043Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5bcaebf4-ed5c-4c42-bfd4-0523b3e59c22"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..90cd782d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:08.326070Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c284aff6-6d78-49dd-bc8f-6569b2cc134c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:08.326070+00:00, try_number=1, job_id=692, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-15 00:00:00+00:00 +INFO - Started process 5686 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-15T00:00:00+00:00', '--job-id', '692', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpc0j95hdl'] +INFO - Job 692: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180615T000000, start_date=20221111T005608, end_date=20221111T005612 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:12.919232Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c284aff6-6d78-49dd-bc8f-6569b2cc134c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a900e870 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:08.232350Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a872a19d-58a2-3bde-bae8-edd4d19d8810"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f303b56-1c8c-4cb7-83c4-895705fe3be4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:08.232350+00:00, try_number=1, job_id=691, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-15 00:00:00+00:00 +INFO - Started process 5684 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-15T00:00:00+00:00', '--job-id', '691', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpucpuzz8q'] +INFO - Job 691: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180615T000000, start_date=20221111T005608, end_date=20221111T005610 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:10.930724Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f303b56-1c8c-4cb7-83c4-895705fe3be4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..e048968f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:20.242453Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46d0fd9f-1c02-4919-9f20-b63e2e276cb5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:20.242453+00:00, try_number=1, job_id=695, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-16 00:00:00+00:00 +INFO - Started process 5784 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-16T00:00:00+00:00', '--job-id', '695', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpypmqlztl'] +INFO - Job 695: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180616T000000, start_date=20221111T005620, end_date=20221111T005623 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:23.312695Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46d0fd9f-1c02-4919-9f20-b63e2e276cb5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d38212c1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:20.254983Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2717cc25-a262-4bc0-ac50-5a4d55a40d52"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:20.254983+00:00, try_number=1, job_id=696, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-16 00:00:00+00:00 +INFO - Started process 5785 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-16T00:00:00+00:00', '--job-id', '696', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4gzwif53'] +INFO - Job 696: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180616T000000, start_date=20221111T005620, end_date=20221111T005623 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:23.336207Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2717cc25-a262-4bc0-ac50-5a4d55a40d52"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..3417fe3e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:32.168560Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7b460c54-adef-4df2-a4a7-eff96929be77"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:32.168560+00:00, try_number=1, job_id=700, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-16 00:00:00+00:00 +INFO - Started process 5801 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-16T00:00:00+00:00', '--job-id', '700', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqk1bgv_q'] +INFO - Job 700: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'qGrMry6MBumuzQaOq0lcaQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:qGrMry6MBumuzQaOq0lcaQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005632Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005632Z +20221111/us-east-1/s3/aws4_request +bff40113a8d9366c3d30fd74af87afc36226cc65d15d8bbbfed07320038b038e +INFO - '2022-11-11' - botocore.auth - Signature: +9888c22030178ab66cd139caf12bc1e877e482fea5f110991d64c2b26cba5675 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '9NehuzYBT1NVRyua+vp/fqeTyjArDsnB6C+zjQ/Bciy2kIK1ek9z8+6XMpBzXeq3tYYAQLDnVTM=', 'x-amz-request-id': 'BFFGHC6YAB8NX81T', 'Date': 'Fri, 11 Nov 2022 00:56:33 GMT', 'ETag': '"a86accaf2e8c06e9aecd068eab495c69"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180616T000000, start_date=20221111T005632, end_date=20221111T005633 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:33.897708Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7b460c54-adef-4df2-a4a7-eff96929be77"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..332a52d5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:29.385452Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9e5c9f78-757d-481b-89a6-a3356f504b9a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:29.385452+00:00, try_number=1, job_id=699, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-16 00:00:00+00:00 +INFO - Started process 5764 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-16T00:00:00+00:00', '--job-id', '699', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkuk4ntwb'] +INFO - Job 699: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005630Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005630Z +20221111/us-east-1/s3/aws4_request +a3961de7c99a0ae55126ffef8782d12d6b3f0842fa604c32d62168d0c28b3f7f +INFO - '2022-11-11' - botocore.auth - Signature: +30fc1d475ad36cf493694050d24ec76779110166787f2f52e112a99ea8a82029 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '2Xq5aH5nlm0Mx/9ZOGKPSN/G9M7zOZ0UDB+jRI1Ha2TUNstM6A7AC7Sk0a/6/0YSePfwCnm9eRc=', 'x-amz-request-id': '2CK1S4G1B14C07A8', 'Date': 'Fri, 11 Nov 2022 00:56:31 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180616T000000, start_date=20221111T005629, end_date=20221111T005631 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:31.765579Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9e5c9f78-757d-481b-89a6-a3356f504b9a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..596ad0c3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:25.173206Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f5dca56-486a-422f-a851-617f8c91784d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:25.173206+00:00, try_number=1, job_id=698, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-16 00:00:00+00:00 +INFO - Started process 5795 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-16T00:00:00+00:00', '--job-id', '698', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptl_ykyx3'] +INFO - Job 698: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180616T000000, start_date=20221111T005625, end_date=20221111T005630 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:30.852499Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5f5dca56-486a-422f-a851-617f8c91784d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f475b02b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:25.157375Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "cbe09b8f-c06a-30f9-963f-cc5b8a38e1e1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "729f25fc-5a41-4c42-b067-17e648b2792a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:25.157375+00:00, try_number=1, job_id=697, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-16 00:00:00+00:00 +INFO - Started process 5794 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-16T00:00:00+00:00', '--job-id', '697', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptogxm69q'] +INFO - Job 697: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180616T000000, start_date=20221111T005625, end_date=20221111T005627 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:27.774139Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "729f25fc-5a41-4c42-b067-17e648b2792a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7d0fdd24 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:36.299701Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d9e3360-bd45-43cd-95c9-e8e23e5d5754"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:36.299701+00:00, try_number=1, job_id=702, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-17 00:00:00+00:00 +INFO - Started process 5837 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-17T00:00:00+00:00', '--job-id', '702', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpen0bs47z'] +INFO - Job 702: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180617T000000, start_date=20221111T005636, end_date=20221111T005639 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:39.006685Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d9e3360-bd45-43cd-95c9-e8e23e5d5754"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6be23a17 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:36.294573Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64cecfa1-b117-4214-9e0d-7fd62b134763"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:36.294573+00:00, try_number=1, job_id=701, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-17 00:00:00+00:00 +INFO - Started process 5832 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-17T00:00:00+00:00', '--job-id', '701', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_q4uzmz5'] +INFO - Job 701: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180617T000000, start_date=20221111T005636, end_date=20221111T005639 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:39.021712Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64cecfa1-b117-4214-9e0d-7fd62b134763"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..b306c8c4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:48.802476Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ca0a6bb-90e2-488d-af07-326806651762"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:48.802476+00:00, try_number=1, job_id=706, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-17 00:00:00+00:00 +INFO - Started process 5788 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-17T00:00:00+00:00', '--job-id', '706', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4866m52k'] +INFO - Job 706: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'C+U2/uOM7InKjnMmIOQ68w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:C+U2/uOM7InKjnMmIOQ68w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005649Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005649Z +20221111/us-east-1/s3/aws4_request +93b209aea4d57c6b856876432ddccb6ea692a5a7cf072d8631c16dadfcaeb79a +INFO - '2022-11-11' - botocore.auth - Signature: +37310042672f3bd9073ba666a14607325cb21ea0603dd3ff2b475bb81145dd09 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'H1CefxCsEvnPg1b5kumDbqnmzG72yl9E5bEniehXht+Lm7QcHfV6YgpXer6PVMkll8P6CS5Op1U=', 'x-amz-request-id': 'J63TW8T77ARH56XC', 'Date': 'Fri, 11 Nov 2022 00:56:50 GMT', 'ETag': '"0be536fee38cec89ca8e732620e43af3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180617T000000, start_date=20221111T005648, end_date=20221111T005650 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:50.642503Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ca0a6bb-90e2-488d-af07-326806651762"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f17c0faa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:45.916928Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "286df37f-6bb7-497b-b05e-bf4721b45cb8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:45.916928+00:00, try_number=1, job_id=705, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-17 00:00:00+00:00 +INFO - Started process 5780 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-17T00:00:00+00:00', '--job-id', '705', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7ik0dj5z'] +INFO - Job 705: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005646Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005646Z +20221111/us-east-1/s3/aws4_request +9f9030d8bb9696b719b2882c45cc55ff150bb4c66b213f4bf95fb2374e04dd80 +INFO - '2022-11-11' - botocore.auth - Signature: +3faa4e88b07729f22e8db4d48ce06c8d912c0f086251ce4c3131218ba7bff6b3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '5NztTIKGMI16WU9mZYgNghLV12Ece1ctjgHjukSWJO4P8W72+Dhk/xl8ei3Ez0r1qMb20r3CWcw=', 'x-amz-request-id': 'HCAYFE1DG9HQGP1J', 'Date': 'Fri, 11 Nov 2022 00:56:47 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180617T000000, start_date=20221111T005645, end_date=20221111T005647 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:47.851460Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "286df37f-6bb7-497b-b05e-bf4721b45cb8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8ec80f46 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:41.017272Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a2c0481b-523d-466b-b89c-d8e7ddaac2f0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:41.017272+00:00, try_number=1, job_id=704, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-17 00:00:00+00:00 +INFO - Started process 5775 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-17T00:00:00+00:00', '--job-id', '704', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_mppv2de'] +INFO - Job 704: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180617T000000, start_date=20221111T005641, end_date=20221111T005646 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:46.438172Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a2c0481b-523d-466b-b89c-d8e7ddaac2f0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..fcec3502 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:41.011040Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "282f89da-42e0-350c-b2d2-826307feea39"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b6e6fc05-2650-42c5-a1e9-6a82a41fed6e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:41.011040+00:00, try_number=1, job_id=703, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-17 00:00:00+00:00 +INFO - Started process 5773 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-17T00:00:00+00:00', '--job-id', '703', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfoiw74om'] +INFO - Job 703: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180617T000000, start_date=20221111T005641, end_date=20221111T005643 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:43.881767Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b6e6fc05-2650-42c5-a1e9-6a82a41fed6e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7364a445 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:53.184479Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d2cdcda-ebd7-40c7-9943-6e15d4afffeb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:53.184479+00:00, try_number=1, job_id=708, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-18 00:00:00+00:00 +INFO - Started process 5861 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-18T00:00:00+00:00', '--job-id', '708', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmponjoiqcc'] +INFO - Job 708: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180618T000000, start_date=20221111T005653, end_date=20221111T005656 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:56.166139Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d2cdcda-ebd7-40c7-9943-6e15d4afffeb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..faf2ea64 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:56:53.184606Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93222119-3f2e-438e-87b4-2b7d24e72ab4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:53.184606+00:00, try_number=1, job_id=707, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-18 00:00:00+00:00 +INFO - Started process 5864 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-18T00:00:00+00:00', '--job-id', '707', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbtue3iwk'] +INFO - Job 707: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180618T000000, start_date=20221111T005653, end_date=20221111T005655 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:56:55.914449Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93222119-3f2e-438e-87b4-2b7d24e72ab4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..60d46b19 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:04.244346Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64001fdd-542b-45c2-9d5b-f5b99c8b8acb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:04.244346+00:00, try_number=1, job_id=712, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-18 00:00:00+00:00 +INFO - Started process 5893 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-18T00:00:00+00:00', '--job-id', '712', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpukei9o4b'] +INFO - Job 712: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'KcYQ384FxRa2WB43lz+ZPA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:KcYQ384FxRa2WB43lz+ZPA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005705Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005705Z +20221111/us-east-1/s3/aws4_request +e39e6848e26f6fe283039ad2e2d5942f95eeb7cb5f0ea440bf5b7c75f75a97bb +INFO - '2022-11-11' - botocore.auth - Signature: +1240dbc64a6d3cb23cfe0023ce6b5d8ffa3a5dd6e3b9d1df62bb6402bdaa5b5b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+UmkvzVJ6ukkYjPcPJMPLnOgRJ2Ncif8dFDtrIte69X62K79T8VxZ4NBRMxiBkNo/e7CceaWQV4=', 'x-amz-request-id': 'FE17WAVAJ073TF21', 'Date': 'Fri, 11 Nov 2022 00:57:05 GMT', 'ETag': '"29c610dfce05c516b6581e37973f993c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180618T000000, start_date=20221111T005704, end_date=20221111T005706 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:06.140630Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "64001fdd-542b-45c2-9d5b-f5b99c8b8acb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4ce32dbe --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:02.473029Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a7ffc43f-82d6-4794-889b-36e130c5b3cf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:02.473029+00:00, try_number=1, job_id=711, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-18 00:00:00+00:00 +INFO - Started process 5870 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-18T00:00:00+00:00', '--job-id', '711', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy820b8r3'] +INFO - Job 711: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005703Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005703Z +20221111/us-east-1/s3/aws4_request +d2853ff307c89433bc9af32ea3931164baacb95ea6e40872611add6c127808f8 +INFO - '2022-11-11' - botocore.auth - Signature: +b27cc74ed0563e10dc31bbc3321947112cc04b44a29564bfb5eb322727b92ef0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mZum2W6OZjpgaqHD+LjsG+VuxbDWuzi18xXHwsbefNgYgZPZLevHsBF0irQRHSvCA/Z5lLLFJ4A=', 'x-amz-request-id': '8Y1A5FD178TVX7FK', 'Date': 'Fri, 11 Nov 2022 00:57:03 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180618T000000, start_date=20221111T005702, end_date=20221111T005704 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:04.346127Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a7ffc43f-82d6-4794-889b-36e130c5b3cf"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e59fe2d8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:57.770452Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1bc07a62-88c1-4748-a024-af564622362b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:57.770452+00:00, try_number=1, job_id=709, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-18 00:00:00+00:00 +INFO - Started process 5887 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-18T00:00:00+00:00', '--job-id', '709', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdg2gy7pt'] +INFO - Job 709: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180618T000000, start_date=20221111T005657, end_date=20221111T005702 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:02.851724Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1bc07a62-88c1-4748-a024-af564622362b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a0dcec08 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:56:57.771028Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d8428e82-bfa5-3b48-aa7e-e17a6d8893d6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4dd0a724-6ef6-4562-8bce-dcbd750a4aa9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:56:57.771028+00:00, try_number=1, job_id=710, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-18 00:00:00+00:00 +INFO - Started process 5886 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-18T00:00:00+00:00', '--job-id', '710', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr2fa5iie'] +INFO - Job 710: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180618T000000, start_date=20221111T005657, end_date=20221111T005700 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:00.376712Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4dd0a724-6ef6-4562-8bce-dcbd750a4aa9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..141c5ddd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:08.517313Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ac0481ce-b9bc-4230-9d8d-cf2d0d161a0a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:08.517313+00:00, try_number=1, job_id=714, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-19 00:00:00+00:00 +INFO - Started process 5927 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-19T00:00:00+00:00', '--job-id', '714', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkicvxnqu'] +INFO - Job 714: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180619T000000, start_date=20221111T005708, end_date=20221111T005711 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:11.601725Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ac0481ce-b9bc-4230-9d8d-cf2d0d161a0a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..19a1f473 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:08.519038Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f3f95d86-2115-4703-b5b6-9e8ab83250fb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:08.519038+00:00, try_number=1, job_id=713, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-19 00:00:00+00:00 +INFO - Started process 5935 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-19T00:00:00+00:00', '--job-id', '713', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgvofg4ue'] +INFO - Job 713: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180619T000000, start_date=20221111T005708, end_date=20221111T005711 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:11.541883Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f3f95d86-2115-4703-b5b6-9e8ab83250fb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..dc1d9af9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:20.955952Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5b69dd71-6e35-49ff-9a35-820f7f0af0c6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:20.955952+00:00, try_number=1, job_id=718, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-19 00:00:00+00:00 +INFO - Started process 5914 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-19T00:00:00+00:00', '--job-id', '718', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl1jf4ycx'] +INFO - Job 718: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '/qMvE4STIzwRAtKzypqBHg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:/qMvE4STIzwRAtKzypqBHg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005721Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005721Z +20221111/us-east-1/s3/aws4_request +002573fb75bbb0f5b6f7f6899dd97c252779d4faa9baf888e46f3c134534198b +INFO - '2022-11-11' - botocore.auth - Signature: +18c490bef509a9ee1cf9b3e08b5bf5df94941300a72d0f17337c3419ba772b3a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'vComwFmECxcDStNVLAf2JuxVK40ym6QfBOjINDymTssjI1ckRmhclAXhW/X82T1oNP8xgv7S70Y=', 'x-amz-request-id': 'YW3G8B3JCPAGCGSS', 'Date': 'Fri, 11 Nov 2022 00:57:22 GMT', 'ETag': '"fea32f138493233c1102d2b3ca9a811e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180619T000000, start_date=20221111T005720, end_date=20221111T005722 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:22.830188Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5b69dd71-6e35-49ff-9a35-820f7f0af0c6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..80259c27 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:18.127578Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9c396ae-f376-4ed0-a6c1-ca830714fba1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:18.127578+00:00, try_number=1, job_id=717, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-19 00:00:00+00:00 +INFO - Started process 5886 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-19T00:00:00+00:00', '--job-id', '717', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe2_ugouq'] +INFO - Job 717: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005718Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005718Z +20221111/us-east-1/s3/aws4_request +33963e0ef4c21779867116b574ead0d777a41864d2beffbfed262c345e746f74 +INFO - '2022-11-11' - botocore.auth - Signature: +76d1ff2be449e5710cdc791ac1ff096bf7982c450eedce7024c4db624a880983 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'FQ/wLs2uBj/C6iTvqo1RlpVVDclQUzr+lEjwpIWlxiM87J45rLjLRC8MvzkSukIzCFg6oDXFLUw=', 'x-amz-request-id': 'W8C1WAH2FZBDXK9X', 'Date': 'Fri, 11 Nov 2022 00:57:19 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180619T000000, start_date=20221111T005718, end_date=20221111T005720 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:20.041397Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9c396ae-f376-4ed0-a6c1-ca830714fba1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..7d6ddcde --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:13.431217Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e8f24ec-f644-4c4b-88bd-b48ca4b3df49"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:13.431217+00:00, try_number=1, job_id=716, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-19 00:00:00+00:00 +INFO - Started process 5881 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-19T00:00:00+00:00', '--job-id', '716', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnftulqrl'] +INFO - Job 716: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180619T000000, start_date=20221111T005713, end_date=20221111T005718 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:18.630294Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e8f24ec-f644-4c4b-88bd-b48ca4b3df49"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..903080ca --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:13.303826Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "201e825a-0797-3bf8-9cb2-001f0d2d8427"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b0815e86-ecd8-4285-9f38-78b95cbbc252"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:13.303826+00:00, try_number=1, job_id=715, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-19 00:00:00+00:00 +INFO - Started process 5879 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-19T00:00:00+00:00', '--job-id', '715', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxs9y3k3v'] +INFO - Job 715: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180619T000000, start_date=20221111T005713, end_date=20221111T005715 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:15.904456Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b0815e86-ecd8-4285-9f38-78b95cbbc252"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9b662415 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:25.095254Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b1712591-30b5-4ad3-b429-87aaea279de0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:25.095254+00:00, try_number=1, job_id=719, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-20 00:00:00+00:00 +INFO - Started process 5970 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-20T00:00:00+00:00', '--job-id', '719', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5bfp__p8'] +INFO - Job 719: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180620T000000, start_date=20221111T005725, end_date=20221111T005728 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:28.114744Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b1712591-30b5-4ad3-b429-87aaea279de0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..9f515b20 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:25.090726Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e53314e0-fd14-443e-b983-6ba5367c1913"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:25.090726+00:00, try_number=1, job_id=720, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-20 00:00:00+00:00 +INFO - Started process 5967 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-20T00:00:00+00:00', '--job-id', '720', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbxz2vvb9'] +INFO - Job 720: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180620T000000, start_date=20221111T005725, end_date=20221111T005729 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:29.460232Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e53314e0-fd14-443e-b983-6ba5367c1913"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e8da22ef --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:36.370803Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cc627b4-91af-45ea-9999-2ffa884abc05"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:36.370803+00:00, try_number=1, job_id=724, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-20 00:00:00+00:00 +INFO - Started process 5980 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-20T00:00:00+00:00', '--job-id', '724', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi596_e2q'] +INFO - Job 724: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '/qMvE4STIzwRAtKzypqBHg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:/qMvE4STIzwRAtKzypqBHg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005737Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005737Z +20221111/us-east-1/s3/aws4_request +fdcfdc61d4d589cbb0b348078990085fc6fc320061fcfdea4f420808b7d3046f +INFO - '2022-11-11' - botocore.auth - Signature: +6f057c7742af1eaefa907716af8fe0592b61b9675ffe95e92a26278dc74b3bbf +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'cDix3Q+v6ox6x3lMno3GK3aXBuOpONCqTbPf39ARXN/GxEeRX+6cvDvJlWkr82gsodmKZyUgMfQ=', 'x-amz-request-id': '0G65VPB59BV38HV8', 'Date': 'Fri, 11 Nov 2022 00:57:37 GMT', 'ETag': '"fea32f138493233c1102d2b3ca9a811e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180620T000000, start_date=20221111T005736, end_date=20221111T005738 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:38.448416Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1cc627b4-91af-45ea-9999-2ffa884abc05"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..87b699c6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:36.356081Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a1b89b03-87f2-4438-a19a-0c2dfd62ebdf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:36.356081+00:00, try_number=1, job_id=723, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-20 00:00:00+00:00 +INFO - Started process 5978 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-20T00:00:00+00:00', '--job-id', '723', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsv96jt9y'] +INFO - Job 723: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005737Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005737Z +20221111/us-east-1/s3/aws4_request +ed3c1c77d827d317f98aadbb41878280ea4ad8729b6c09375134a22bf3086864 +INFO - '2022-11-11' - botocore.auth - Signature: +928d5ef4c8aa5d761e8f3273c56219127a31c22ff9734d542aa4a7be8b8587f0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'LOKDRDfz/b1hbMnBbWv0cdVD2/0v64KKjUD5lCmERGSjvhM4Hqfty5QKJxf2+3nHset5f4RsEC8=', 'x-amz-request-id': '0G69MRJVWT7BQBWJ', 'Date': 'Fri, 11 Nov 2022 00:57:37 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180620T000000, start_date=20221111T005736, end_date=20221111T005738 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:38.496920Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a1b89b03-87f2-4438-a19a-0c2dfd62ebdf"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..2ab16c80 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:29.585972Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74323508-1203-4321-8788-348e8eedde27"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:29.585972+00:00, try_number=1, job_id=721, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-20 00:00:00+00:00 +INFO - Started process 5975 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-20T00:00:00+00:00', '--job-id', '721', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnf_iftsy'] +INFO - Job 721: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180620T000000, start_date=20221111T005729, end_date=20221111T005734 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:34.503401Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74323508-1203-4321-8788-348e8eedde27"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3ff47b92 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:31.282096Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "24245d77-d966-3015-92d9-2334c1b4c7cf"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ca618d3c-64cb-4a5a-befc-98cdcf7aed8e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:31.282096+00:00, try_number=1, job_id=722, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-20 00:00:00+00:00 +INFO - Started process 5979 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-20T00:00:00+00:00', '--job-id', '722', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4fv5otwz'] +INFO - Job 722: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180620T000000, start_date=20221111T005731, end_date=20221111T005734 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:34.285493Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ca618d3c-64cb-4a5a-befc-98cdcf7aed8e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0d6e36d8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:40.854790Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a855c4c-72fc-4198-ba56-a43295d7688e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:40.854790+00:00, try_number=1, job_id=726, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-21 00:00:00+00:00 +INFO - Started process 5994 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-21T00:00:00+00:00', '--job-id', '726', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkzxhjyx5'] +INFO - Job 726: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180621T000000, start_date=20221111T005740, end_date=20221111T005744 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:44.227850Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a855c4c-72fc-4198-ba56-a43295d7688e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bf3ae780 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:40.797551Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a0e642a0-d29f-407e-b663-350d297d6600"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:40.797551+00:00, try_number=1, job_id=725, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-21 00:00:00+00:00 +INFO - Started process 5992 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-21T00:00:00+00:00', '--job-id', '725', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4gpwp9gn'] +INFO - Job 725: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180621T000000, start_date=20221111T005740, end_date=20221111T005744 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:44.302113Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a0e642a0-d29f-407e-b663-350d297d6600"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..b9e219df --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:54.517123Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "14a45d01-7e2b-4b44-9940-b40c890f4bc9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:54.517123+00:00, try_number=1, job_id=730, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-21 00:00:00+00:00 +INFO - Started process 6060 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-21T00:00:00+00:00', '--job-id', '730', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuvxo6943'] +INFO - Job 730: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'y/Z84e/XjrujHpOYKrM3Dg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:y/Z84e/XjrujHpOYKrM3Dg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005755Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005755Z +20221111/us-east-1/s3/aws4_request +c963130a1ec7caa13a386ac8e24a8695efbffd54c04f1f3c7a9529f758232ec8 +INFO - '2022-11-11' - botocore.auth - Signature: +312edd6f7e3a981203a552aa98f104e1b55ce3c1886cede6bef28b56bf207214 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BjeloXQVzQ+6as5aOQh8iMW6hiH4rDnPFAGDEuDw1gWWhI3222obLDe5ZyJDVIUuWTR1TmzotxY=', 'x-amz-request-id': 'ZJ031ZPSPZZRY400', 'Date': 'Fri, 11 Nov 2022 00:57:56 GMT', 'ETag': '"cbf67ce1efd78ebba31e93982ab3370e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180621T000000, start_date=20221111T005754, end_date=20221111T005756 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:56.709978Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "14a45d01-7e2b-4b44-9940-b40c890f4bc9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1bdfc7be --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:51.097837Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed48aaf2-107a-4728-afba-4e3252572502"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:51.097837+00:00, try_number=1, job_id=729, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-21 00:00:00+00:00 +INFO - Started process 6000 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-21T00:00:00+00:00', '--job-id', '729', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9scb4t51'] +INFO - Job 729: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005752Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005752Z +20221111/us-east-1/s3/aws4_request +cd9ba1dc897c6581146dace81d3fa0e54175ea5e5af6131efbd517c22f428f83 +INFO - '2022-11-11' - botocore.auth - Signature: +fc3479a581fc98f196520e1bcd224682225c0bdf06fd70755c81f27146435ca6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'LZchEialf6p9rrsytHKmMzQKnkES65ymW+iC9cdmJ3YdrV37RfBMWYavmJCUXCmGf/tWaBVs+1M=', 'x-amz-request-id': '3NZ3NN9MPV1GV89M', 'Date': 'Fri, 11 Nov 2022 00:57:52 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180621T000000, start_date=20221111T005751, end_date=20221111T005753 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:53.156171Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed48aaf2-107a-4728-afba-4e3252572502"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e8017a1d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:46.043474Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2766d22a-ecb2-4734-a9ea-b548fb82eecb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:46.043474+00:00, try_number=1, job_id=728, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-21 00:00:00+00:00 +INFO - Started process 6054 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-21T00:00:00+00:00', '--job-id', '728', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn0iqwxbm'] +INFO - Job 728: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180621T000000, start_date=20221111T005746, end_date=20221111T005751 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:51.936613Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2766d22a-ecb2-4734-a9ea-b548fb82eecb"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e8c8601d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:57:46.003646Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e8039834-ea7c-32f9-b375-0f5f82c81088"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aac33700-a2d9-4836-a310-7efd1fba8a27"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:46.003646+00:00, try_number=1, job_id=727, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-21 00:00:00+00:00 +INFO - Started process 6052 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-21T00:00:00+00:00', '--job-id', '727', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4z_kvmgn'] +INFO - Job 727: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180621T000000, start_date=20221111T005746, end_date=20221111T005748 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:57:48.901522Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aac33700-a2d9-4836-a310-7efd1fba8a27"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..3594b374 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:59.017738Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "59d5cfa0-98cd-405a-be77-bf7f31884322"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:59.017738+00:00, try_number=1, job_id=732, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-22 00:00:00+00:00 +INFO - Started process 6071 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-22T00:00:00+00:00', '--job-id', '732', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphkqkglnu'] +INFO - Job 732: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180622T000000, start_date=20221111T005759, end_date=20221111T005801 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:01.769437Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "59d5cfa0-98cd-405a-be77-bf7f31884322"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..9136eb67 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:57:58.998566Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e47fd37-ce77-41df-8636-166514dac22b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:57:58.998566+00:00, try_number=1, job_id=731, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-22 00:00:00+00:00 +INFO - Started process 6069 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-22T00:00:00+00:00', '--job-id', '731', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6plfzp1q'] +INFO - Job 731: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180622T000000, start_date=20221111T005758, end_date=20221111T005801 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:01.916871Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e47fd37-ce77-41df-8636-166514dac22b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..2e1fcf06 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:11.753880Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b4fa823a-18a4-44e1-8af0-7d7c41d1b0fe"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:11.753880+00:00, try_number=1, job_id=736, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-22 00:00:00+00:00 +INFO - Started process 6089 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-22T00:00:00+00:00', '--job-id', '736', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo80yz6w7'] +INFO - Job 736: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f2f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '+qczihmEdiLFGRWoitd+hg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:+qczihmEdiLFGRWoitd+hg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005812Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005812Z +20221111/us-east-1/s3/aws4_request +98a1a100d8e35c066776c764eb00011a03a163c8c1e640f9575899f1e3b9a069 +INFO - '2022-11-11' - botocore.auth - Signature: +e2d1df8032b3b739b911137eae667ed819f2ac007fc4d22ead1a33130de23597 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'LZoQj+QW26OmJuMD5pBxe50toXmQI8SrBrtrCsHGgXnt1x0lO2aTU7logufs5FbTwsm0J4sbshk=', 'x-amz-request-id': 'TTAGSVR3KNMCZPTC', 'Date': 'Fri, 11 Nov 2022 00:58:13 GMT', 'ETag': '"faa7338a19847622c51915a88ad77e86"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180622T000000, start_date=20221111T005811, end_date=20221111T005813 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:13.886671Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b4fa823a-18a4-44e1-8af0-7d7c41d1b0fe"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5cc76ee0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:07.994769Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "644696a8-389b-44fb-b2e5-354a4d50a23e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:07.994769+00:00, try_number=1, job_id=735, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-22 00:00:00+00:00 +INFO - Started process 6081 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-22T00:00:00+00:00', '--job-id', '735', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3wlyy5jz'] +INFO - Job 735: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005809Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005809Z +20221111/us-east-1/s3/aws4_request +3ef8b5b6c9c1cfca6f16d101e550f5e9091939126ec1e103f47bff5c7c661384 +INFO - '2022-11-11' - botocore.auth - Signature: +890604a3bddd8c9b393d486e010f23d849bc09104e8b2ce10a58311711dc451d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'MzTBjAn8OuxVa4DJ6uj03KCZt0fPttwd1WQSXgg0pSi1LcJUczitGwPNmsni7L7hZ7B2NE/kXmrZLIWFY2ReAg==', 'x-amz-request-id': 'A0ZTWYH0XSY0R3B1', 'Date': 'Fri, 11 Nov 2022 00:58:09 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180622T000000, start_date=20221111T005807, end_date=20221111T005810 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:10.282494Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "644696a8-389b-44fb-b2e5-354a4d50a23e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d6758725 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:03.544093Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "af7b2019-2b53-4d73-8173-d455704ebb43"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:03.544093+00:00, try_number=1, job_id=734, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-22 00:00:00+00:00 +INFO - Started process 6076 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-22T00:00:00+00:00', '--job-id', '734', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwqizpes3'] +INFO - Job 734: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180622T000000, start_date=20221111T005803, end_date=20221111T005809 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:09.705925Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "af7b2019-2b53-4d73-8173-d455704ebb43"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..54c93867 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:03.514958Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "080ae0ce-c7fb-31c5-850e-2d9491fbcc65"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bcaf59cb-a779-48fc-bf9b-a9ff21ba5a83"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:03.514958+00:00, try_number=1, job_id=733, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-22 00:00:00+00:00 +INFO - Started process 6074 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-22T00:00:00+00:00', '--job-id', '733', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptnvvja80'] +INFO - Job 733: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180622T000000, start_date=20221111T005803, end_date=20221111T005806 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:06.309758Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bcaf59cb-a779-48fc-bf9b-a9ff21ba5a83"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..fb3a6583 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:58:15.802975Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a7926dc3-d77e-49fc-8586-e458a7eef1d2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:15.802975+00:00, try_number=1, job_id=738, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-23 00:00:00+00:00 +INFO - Started process 6097 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-23T00:00:00+00:00', '--job-id', '738', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp85q1f9j'] +INFO - Job 738: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180623T000000, start_date=20221111T005815, end_date=20221111T005818 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:18.703513Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a7926dc3-d77e-49fc-8586-e458a7eef1d2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7ce4f394 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:58:15.809101Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0ab7705e-b3ef-4eb9-b6e9-e7e9dde70f92"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:15.809101+00:00, try_number=1, job_id=737, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-23 00:00:00+00:00 +INFO - Started process 6100 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-23T00:00:00+00:00', '--job-id', '737', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnkuc675h'] +INFO - Job 737: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180623T000000, start_date=20221111T005815, end_date=20221111T005818 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:18.709874Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0ab7705e-b3ef-4eb9-b6e9-e7e9dde70f92"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..ba97dd22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:27.933232Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ad0a33c7-9d86-47bb-b38d-da6e93c2c446"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:27.933232+00:00, try_number=1, job_id=742, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-23 00:00:00+00:00 +INFO - Started process 6178 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-23T00:00:00+00:00', '--job-id', '742', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3yvz5nn8'] +INFO - Job 742: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '+qczihmEdiLFGRWoitd+hg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:+qczihmEdiLFGRWoitd+hg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005828Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005828Z +20221111/us-east-1/s3/aws4_request +203ac66cebaf2daba8a48f802310b50b0fe123ba791f7e481d9598a36fc8bcd4 +INFO - '2022-11-11' - botocore.auth - Signature: +f99485d4ebf39519617be4a697c00e0ae372412793cebdfd7454a30ff86124a8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '38yF90dgYrajJSN22+QUsFd5ZAE+2nOLfQCuf2eLCSSyzqrGIAnFFr5qrKqEv3B2zdg7Xkdz5VE=', 'x-amz-request-id': 'S4K9VD5N2GEMAWWH', 'Date': 'Fri, 11 Nov 2022 00:58:29 GMT', 'ETag': '"faa7338a19847622c51915a88ad77e86"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180623T000000, start_date=20221111T005827, end_date=20221111T005829 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:29.689734Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ad0a33c7-9d86-47bb-b38d-da6e93c2c446"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b8280c8d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:25.675254Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dae01dc2-99bc-49be-ab74-99d298d8f97f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:25.675254+00:00, try_number=1, job_id=741, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-23 00:00:00+00:00 +INFO - Started process 6155 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-23T00:00:00+00:00', '--job-id', '741', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxihe676w'] +INFO - Job 741: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005826Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005826Z +20221111/us-east-1/s3/aws4_request +24897792c2bc9e66b49462901c66a3ebb5cf1cbb0f4fe645d9fc274e7fadd55c +INFO - '2022-11-11' - botocore.auth - Signature: +0621ad41945e3d15105da9adff7bd76f0a5e9fd607c3a0b502cb4d7fcf385810 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'toOpE+1RTHovzj+teJVDyBIRtjNMNKy6T9HGkeNNrSFj3Qpm0WGB4I60V51yPxiUfcqTr4GOM1I=', 'x-amz-request-id': 'VZGB5TTTA89DZV2V', 'Date': 'Fri, 11 Nov 2022 00:58:27 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180623T000000, start_date=20221111T005825, end_date=20221111T005828 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:28.058225Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dae01dc2-99bc-49be-ab74-99d298d8f97f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..4a52e45e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:20.474381Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "83527d81-499e-46a0-9dc7-337779bd090e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:20.474381+00:00, try_number=1, job_id=739, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-23 00:00:00+00:00 +INFO - Started process 6144 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-23T00:00:00+00:00', '--job-id', '739', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4u5cj2sm'] +INFO - Job 739: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180623T000000, start_date=20221111T005820, end_date=20221111T005826 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:26.613381Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "83527d81-499e-46a0-9dc7-337779bd090e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..892e9408 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:20.504450Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "f9ce46da-438a-3eb7-a6d4-9f9834cac15f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "106c5aef-61b7-45bb-ae3a-17d8e83a0cab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:20.504450+00:00, try_number=1, job_id=740, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-23 00:00:00+00:00 +INFO - Started process 6146 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-23T00:00:00+00:00', '--job-id', '740', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7dodn6mq'] +INFO - Job 740: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180623T000000, start_date=20221111T005820, end_date=20221111T005823 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:23.321734Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "106c5aef-61b7-45bb-ae3a-17d8e83a0cab"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6f24ced5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:58:32.247957Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "28093127-39b4-41d6-9a4e-32b69c310321"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:32.247957+00:00, try_number=1, job_id=743, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-24 00:00:00+00:00 +INFO - Started process 6189 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-24T00:00:00+00:00', '--job-id', '743', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdfduqd_c'] +INFO - Job 743: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180624T000000, start_date=20221111T005832, end_date=20221111T005834 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:34.938791Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "28093127-39b4-41d6-9a4e-32b69c310321"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..9123cd6d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:58:32.250364Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d466fccd-586f-4bb0-aeba-4e079c53cba5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:32.250364+00:00, try_number=1, job_id=744, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-24 00:00:00+00:00 +INFO - Started process 6186 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-24T00:00:00+00:00', '--job-id', '744', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfeetzvt9'] +INFO - Job 744: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180624T000000, start_date=20221111T005832, end_date=20221111T005835 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:35.043453Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d466fccd-586f-4bb0-aeba-4e079c53cba5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..ee7ae06c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:44.766918Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45e77475-51f5-4e2e-b84e-32beee92593d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:44.766918+00:00, try_number=1, job_id=748, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-24 00:00:00+00:00 +INFO - Started process 6195 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-24T00:00:00+00:00', '--job-id', '748', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp0s8dxa9'] +INFO - Job 748: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '+qczihmEdiLFGRWoitd+hg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:+qczihmEdiLFGRWoitd+hg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005845Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005845Z +20221111/us-east-1/s3/aws4_request +928e8196bbd0c5d7f7ac4e6bfd21b957d20e3d225facd0d2a532d76665e3ecf5 +INFO - '2022-11-11' - botocore.auth - Signature: +f4d6168b8dbf932f476ffc3eb2aae04c9e9ce230e81ad67dd98d788fc020330d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '7KrFhw6BaoGEoM/nllO85DDLn4MIyBdhWBxP0AHxdO4DZR/o672LySdyDtFiF+qpYj0571IWWrE=', 'x-amz-request-id': 'PNXZYEJJC4TDVEEQ', 'Date': 'Fri, 11 Nov 2022 00:58:46 GMT', 'ETag': '"faa7338a19847622c51915a88ad77e86"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180624T000000, start_date=20221111T005844, end_date=20221111T005846 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:46.919376Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45e77475-51f5-4e2e-b84e-32beee92593d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..06722e67 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:42.304853Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dc8d7838-fa56-495d-9d26-6b752ab2345f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:42.304853+00:00, try_number=1, job_id=747, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-24 00:00:00+00:00 +INFO - Started process 6195 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-24T00:00:00+00:00', '--job-id', '747', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnn2z55xu'] +INFO - Job 747: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50073a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005843Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005843Z +20221111/us-east-1/s3/aws4_request +4f7fdc2ebd2b87fbf79fa09a89d768f5067537d067b8d0fc671c6125745173f9 +INFO - '2022-11-11' - botocore.auth - Signature: +47ec34d65090663fed5ecabd68ac652ab6d0c91d764e2cee274af55650bd1315 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'K4sm8t8LdL5LD1qCWJPPhkCBkd0rq7CL2MCEuD/6U+B8+HpFXisA93PhuRL0HbeNmIeXXvNSpRY=', 'x-amz-request-id': 'JHWH0KBJQY70MAAB', 'Date': 'Fri, 11 Nov 2022 00:58:44 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180624T000000, start_date=20221111T005842, end_date=20221111T005844 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:44.743837Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dc8d7838-fa56-495d-9d26-6b752ab2345f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..832fc544 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:36.895786Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "70703f7a-d3b8-4fce-ad4b-020a7032c168"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:36.895786+00:00, try_number=1, job_id=746, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-24 00:00:00+00:00 +INFO - Started process 6156 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-24T00:00:00+00:00', '--job-id', '746', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuu9_c5ij'] +INFO - Job 746: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180624T000000, start_date=20221111T005836, end_date=20221111T005843 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:43.105380Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "70703f7a-d3b8-4fce-ad4b-020a7032c168"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..51ac1eb9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:36.890115Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c70034c9-0eb4-351a-9f3b-914ce9914f2e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e80e8127-9431-43bb-b41e-324fade288cd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:36.890115+00:00, try_number=1, job_id=745, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-24 00:00:00+00:00 +INFO - Started process 6155 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-24T00:00:00+00:00', '--job-id', '745', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpeooct0zc'] +INFO - Job 745: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180624T000000, start_date=20221111T005836, end_date=20221111T005839 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:39.736396Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e80e8127-9431-43bb-b41e-324fade288cd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..3b69abd5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:58:48.822971Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "927ac93b-c994-4824-83a7-b74900966892"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:48.822971+00:00, try_number=1, job_id=749, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-25 00:00:00+00:00 +INFO - Started process 6204 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-25T00:00:00+00:00', '--job-id', '749', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzl1b14t5'] +INFO - Job 749: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180625T000000, start_date=20221111T005848, end_date=20221111T005851 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:51.605093Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "927ac93b-c994-4824-83a7-b74900966892"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bbc08df7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:58:48.915449Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "54e17f00-a4c3-4f5d-ac92-70be1ec404a1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:48.915449+00:00, try_number=1, job_id=750, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-25 00:00:00+00:00 +INFO - Started process 6206 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-25T00:00:00+00:00', '--job-id', '750', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv96bz_cy'] +INFO - Job 750: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180625T000000, start_date=20221111T005848, end_date=20221111T005851 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:51.592813Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "54e17f00-a4c3-4f5d-ac92-70be1ec404a1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..fb983dba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:01.389238Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2ecc001f-4f78-4d7b-8a0e-61080c639f59"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:01.389238+00:00, try_number=1, job_id=754, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-25 00:00:00+00:00 +INFO - Started process 6284 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-25T00:00:00+00:00', '--job-id', '754', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy0kf9s77'] +INFO - Job 754: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '+qczihmEdiLFGRWoitd+hg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:+qczihmEdiLFGRWoitd+hg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005902Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005902Z +20221111/us-east-1/s3/aws4_request +772d76ad10a8753084e4f685a457f77f1909362839c17f029383141ec487ab43 +INFO - '2022-11-11' - botocore.auth - Signature: +dfe3100b66d5ebbd0f0217852b7dd3a119732043d798b0abbee47e22f5ca9078 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'I9eGIBmmIuwb1vnK4o38YYMnIVWedA8JFO4tBVgUVvhW8G/XGUWjj/GoDVdoZ4pkZ/JBPxeMuJg=', 'x-amz-request-id': 'MV09BKZQ420V41WM', 'Date': 'Fri, 11 Nov 2022 00:59:02 GMT', 'ETag': '"faa7338a19847622c51915a88ad77e86"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180625T000000, start_date=20221111T005901, end_date=20221111T005903 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:03.391483Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2ecc001f-4f78-4d7b-8a0e-61080c639f59"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f025b712 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:58.058264Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf998cb0-de4d-4748-b61e-c58b98038097"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:58.058264+00:00, try_number=1, job_id=753, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-25 00:00:00+00:00 +INFO - Started process 6277 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-25T00:00:00+00:00', '--job-id', '753', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpudw6hov7'] +INFO - Job 753: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005858Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005858Z +20221111/us-east-1/s3/aws4_request +fccad0c86dc3cad2304f9ff9a59fad57936c52ab616182f253c2dd4a654275d7 +INFO - '2022-11-11' - botocore.auth - Signature: +216122b39503d4f619bb650a66aba5844dc896b0454955c0f0cf665e1e247e5b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '0heCfDaFVlFoprnCHTczG9Bu1v89yLAiolB7s8U1LIexDpggh24FaEkIO2JBMMIzzxBjxP9r1k8=', 'x-amz-request-id': 'DVTPB36165AEM7BX', 'Date': 'Fri, 11 Nov 2022 00:58:59 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180625T000000, start_date=20221111T005858, end_date=20221111T005900 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:00.132168Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cf998cb0-de4d-4748-b61e-c58b98038097"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ea435e18 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:53.546472Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a1e67b9-423e-4760-922b-1e4117e0214d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:53.546472+00:00, try_number=1, job_id=752, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-25 00:00:00+00:00 +INFO - Started process 6238 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-25T00:00:00+00:00', '--job-id', '752', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpptwy932f'] +INFO - Job 752: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180625T000000, start_date=20221111T005853, end_date=20221111T005859 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:59.868329Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a1e67b9-423e-4760-922b-1e4117e0214d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..cdba64bb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:58:53.492800Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e5db4793-c4bb-3378-b463-f80c69094391"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9fcd4701-2f20-4468-b14b-90595bca08fb"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:58:53.492800+00:00, try_number=1, job_id=751, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-25 00:00:00+00:00 +INFO - Started process 6236 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-25T00:00:00+00:00', '--job-id', '751', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqcwiytmo'] +INFO - Job 751: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180625T000000, start_date=20221111T005853, end_date=20221111T005856 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:58:56.115787Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9fcd4701-2f20-4468-b14b-90595bca08fb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..cfa11f63 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:05.139192Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ecd935f-af85-421a-bcc4-c1b770d8998e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:05.139192+00:00, try_number=1, job_id=756, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-26 00:00:00+00:00 +INFO - Started process 6248 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-26T00:00:00+00:00', '--job-id', '756', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5abm8ufl'] +INFO - Job 756: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180626T000000, start_date=20221111T005905, end_date=20221111T005910 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:10.057375Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ecd935f-af85-421a-bcc4-c1b770d8998e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..04baf8a2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:05.137399Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e271dd70-fac6-4582-a37a-d8a457b879a9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:05.137399+00:00, try_number=1, job_id=755, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-26 00:00:00+00:00 +INFO - Started process 6245 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-26T00:00:00+00:00', '--job-id', '755', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4gkj30ba'] +INFO - Job 755: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180626T000000, start_date=20221111T005905, end_date=20221111T005908 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:08.415603Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e271dd70-fac6-4582-a37a-d8a457b879a9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1c64d061 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:20.156658Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "75bdd654-0c29-4779-8a4c-a2e73d190e1d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:20.156658+00:00, try_number=1, job_id=760, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-26 00:00:00+00:00 +INFO - Started process 6308 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-26T00:00:00+00:00', '--job-id', '760', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp70a1oatr'] +INFO - Job 760: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eef70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JcZSfwttHEt3q4xlWx6w9Q==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:JcZSfwttHEt3q4xlWx6w9Q== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005920Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005920Z +20221111/us-east-1/s3/aws4_request +ce32c51a64df5daa40c0b0b7a47404a8fd203f12e3d1addf232c6687c073b295 +INFO - '2022-11-11' - botocore.auth - Signature: +0b6c680f79ed73024936e2549ce3167d655d42a9f036bb16e1a192741691d3f4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'm+f/7h/jAjeVsmpdbhEiEHz2ijW8YXJIkwNzdvf3+tGd43beMJedC5A5uXQams9xaa4I6LUvNJI=', 'x-amz-request-id': 'WAVJC83QGTZHKXJ1', 'Date': 'Fri, 11 Nov 2022 00:59:21 GMT', 'ETag': '"25c6527f0b6d1c4b77ab8c655b1eb0f5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180626T000000, start_date=20221111T005920, end_date=20221111T005921 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:21.949843Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "75bdd654-0c29-4779-8a4c-a2e73d190e1d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5da822dd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:15.106726Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d831296a-dfba-4f0d-a7b1-ad1baea7c10d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:15.106726+00:00, try_number=1, job_id=759, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-26 00:00:00+00:00 +INFO - Started process 6300 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-26T00:00:00+00:00', '--job-id', '759', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpttagr7vj'] +INFO - Job 759: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005916Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005916Z +20221111/us-east-1/s3/aws4_request +3bd8823ae08301e6e6f87759282aad090844737af871d2e7e8f258cdac778a5c +INFO - '2022-11-11' - botocore.auth - Signature: +41b5eca5ab052a1677ad683583c98a75ab23f82d79b234e40b29e431789748d6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'sX8MT+0/HCtYkfYqtO5QWhyy4tLsDa4rC8BQgzQ92iaH/dyT+aK9+Z2IflD+CxWsB0iBGGP7HMs=', 'x-amz-request-id': 'NRN467BRA4ZVENPT', 'Date': 'Fri, 11 Nov 2022 00:59:16 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180626T000000, start_date=20221111T005915, end_date=20221111T005917 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:17.328596Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d831296a-dfba-4f0d-a7b1-ad1baea7c10d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e40517f7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:11.840791Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "da0ac867-e422-4209-9477-00f64a119c0b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:11.840791+00:00, try_number=1, job_id=758, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-26 00:00:00+00:00 +INFO - Started process 6295 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-26T00:00:00+00:00', '--job-id', '758', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptf4ravda'] +INFO - Job 758: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180626T000000, start_date=20221111T005911, end_date=20221111T005918 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:18.707278Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "da0ac867-e422-4209-9477-00f64a119c0b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f690e670 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:10.108215Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "c9bdf132-4e71-3179-8515-d58a137e877a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dfb1f1e1-da00-4d28-a20e-fc1b61cafafe"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:10.108215+00:00, try_number=1, job_id=757, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-26 00:00:00+00:00 +INFO - Started process 6291 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-26T00:00:00+00:00', '--job-id', '757', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppdw0hsxf'] +INFO - Job 757: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180626T000000, start_date=20221111T005910, end_date=20221111T005912 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:12.648458Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dfb1f1e1-da00-4d28-a20e-fc1b61cafafe"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6733267b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:24.250922Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b3babebf-9f6d-485f-93b2-fb25e25f5202"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:24.250922+00:00, try_number=1, job_id=761, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-27 00:00:00+00:00 +INFO - Started process 6324 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-27T00:00:00+00:00', '--job-id', '761', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpomqo0kp4'] +INFO - Job 761: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180627T000000, start_date=20221111T005924, end_date=20221111T005928 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:28.613580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b3babebf-9f6d-485f-93b2-fb25e25f5202"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6180c326 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:24.336231Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e68a9e5d-9182-4d76-ada3-1ff8b8a63948"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:24.336231+00:00, try_number=1, job_id=762, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-27 00:00:00+00:00 +INFO - Started process 6325 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-27T00:00:00+00:00', '--job-id', '762', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvfkae2u4'] +INFO - Job 762: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180627T000000, start_date=20221111T005924, end_date=20221111T005928 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:28.397645Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e68a9e5d-9182-4d76-ada3-1ff8b8a63948"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..a233a522 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:37.343089Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5697a583-835c-4705-ab3a-a464e77e3eca"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:37.343089+00:00, try_number=1, job_id=766, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-27 00:00:00+00:00 +INFO - Started process 6319 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-27T00:00:00+00:00', '--job-id', '766', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm6cjyyyj'] +INFO - Job 766: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'QxgV2Qa93+XXkSYzq7kD8w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:QxgV2Qa93+XXkSYzq7kD8w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005938Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005938Z +20221111/us-east-1/s3/aws4_request +2f7b4a6ea6da67c0f2dba151af035b4415d61388b6701d41a09bd5ea66a00aa9 +INFO - '2022-11-11' - botocore.auth - Signature: +5ffbb1f3075f236f2091975242f0c71840420f7925e7c61fd9c426c1e7e6d63c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Xu+r7O2zQbCbP0X3LJIji+wfs1fSAV1L8zo6WvbQ2QFgYIIoxkiLupcSejhv1v1Dm4XwEeyLoppBaGR4+bY21g==', 'x-amz-request-id': 'TVFXKDEX0RQZV6GW', 'Date': 'Fri, 11 Nov 2022 00:59:38 GMT', 'ETag': '"431815d906bddfe5d7912633abb903f3"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180627T000000, start_date=20221111T005937, end_date=20221111T005939 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:39.283308Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5697a583-835c-4705-ab3a-a464e77e3eca"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4a27b9be --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:35.255042Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd0ddf70-16ed-4593-b611-74f4ae477c8c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:35.255042+00:00, try_number=1, job_id=765, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-27 00:00:00+00:00 +INFO - Started process 6399 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-27T00:00:00+00:00', '--job-id', '765', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8xmzztci'] +INFO - Job 765: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005936Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005936Z +20221111/us-east-1/s3/aws4_request +d310129dbb1b30b745bccb291fcd197a4263a6891e887c40b9257721da082056 +INFO - '2022-11-11' - botocore.auth - Signature: +f4b61ea2d57908951ea69b9db7ccf2147069a654391903b8e0e905ff64bae5cc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'eWdIOv7X7502RmxLSg6PEj4iTqSzEGu9JRAqUas5sPBD+BklYUYQSSprKK2BmcEJLKgAeoG6M9M=', 'x-amz-request-id': '60WD16VTD2JTS20Q', 'Date': 'Fri, 11 Nov 2022 00:59:36 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180627T000000, start_date=20221111T005935, end_date=20221111T005937 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:37.534224Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd0ddf70-16ed-4593-b611-74f4ae477c8c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..cd69ab3f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:30.579161Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6ff2975-d404-45e9-93d3-ab0aa0cdb89a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:30.579161+00:00, try_number=1, job_id=763, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-27 00:00:00+00:00 +INFO - Started process 6392 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-27T00:00:00+00:00', '--job-id', '763', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxizhvtc7'] +INFO - Job 763: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180627T000000, start_date=20221111T005930, end_date=20221111T005935 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:35.665549Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6ff2975-d404-45e9-93d3-ab0aa0cdb89a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..febd304c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:30.609354Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "71b432fa-73f3-37c3-828f-baf549097c28"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9b8382c4-6040-4f4b-b336-3a568f1eb398"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:30.609354+00:00, try_number=1, job_id=764, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-27 00:00:00+00:00 +INFO - Started process 6394 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-27T00:00:00+00:00', '--job-id', '764', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq6ct0nca'] +INFO - Job 764: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180627T000000, start_date=20221111T005930, end_date=20221111T005933 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:33.541577Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9b8382c4-6040-4f4b-b336-3a568f1eb398"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7bb26b9e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:41.566788Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "01e19ba2-cfab-46bc-88a2-b7a5edda264d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:41.566788+00:00, try_number=1, job_id=767, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-28 00:00:00+00:00 +INFO - Started process 6353 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-28T00:00:00+00:00', '--job-id', '767', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr5el6huw'] +INFO - Job 767: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180628T000000, start_date=20221111T005941, end_date=20221111T005944 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:44.595655Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "01e19ba2-cfab-46bc-88a2-b7a5edda264d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bee524d3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:41.565819Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc6cc789-8250-4d56-b424-fd336f818ad0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:41.565819+00:00, try_number=1, job_id=768, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-28 00:00:00+00:00 +INFO - Started process 6355 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-28T00:00:00+00:00', '--job-id', '768', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpadw_3b37'] +INFO - Job 768: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180628T000000, start_date=20221111T005941, end_date=20221111T005944 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:44.616130Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc6cc789-8250-4d56-b424-fd336f818ad0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..701d9590 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:54.366984Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "988e3712-3e03-4334-80ae-b90c0edaff1e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:54.366984+00:00, try_number=1, job_id=772, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-28 00:00:00+00:00 +INFO - Started process 6414 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-28T00:00:00+00:00', '--job-id', '772', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvhic424u'] +INFO - Job 772: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'mmac8aRB+9JVwczaFWI8nQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:mmac8aRB+9JVwczaFWI8nQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005955Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005955Z +20221111/us-east-1/s3/aws4_request +d83d786131dcb4fa520c4ded7909d2e50376057dd867ef73bbd4c2ba4a042bf8 +INFO - '2022-11-11' - botocore.auth - Signature: +2c48e8962a39aa18d43b8e6b28eeb642655fd8efbba1320ffae454229f9c5f95 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '7XqgEwk2ZTTeL3vBv5MB6W0oUn7CS+OICwuBbWPshFaQQts78OYATADiQVTNRg5HgO+zRbPklMQ=', 'x-amz-request-id': 'QCYYYHHPWPHGCA37', 'Date': 'Fri, 11 Nov 2022 00:59:55 GMT', 'ETag': '"9a669cf1a441fbd255c1ccda15623c9d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180628T000000, start_date=20221111T005954, end_date=20221111T005956 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:56.629005Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "988e3712-3e03-4334-80ae-b90c0edaff1e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..eb67c216 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:51.356114Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ffa0e99d-c039-4ed9-88a9-a0de77310839"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:51.356114+00:00, try_number=1, job_id=771, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-28 00:00:00+00:00 +INFO - Started process 6407 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-28T00:00:00+00:00', '--job-id', '771', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa7r326od'] +INFO - Job 771: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T005952Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T005952Z +20221111/us-east-1/s3/aws4_request +5f87c326cd162885fdf59496133d9cb36d8f4052138f6a655521fa22425ffe46 +INFO - '2022-11-11' - botocore.auth - Signature: +bdbfd74fbce1eaf3778c6f22f6094e7e75236fd9a9fc47cc4c275712276d96fa +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'y5eEKAV8xWYVCMRR4DKq4Du5mvMde536Qodd3kAj+K3ECZQP2qzR5XjbsE58n8kLUglHXD2qLWc=', 'x-amz-request-id': 'MSHBXNRSYBH4MEET', 'Date': 'Fri, 11 Nov 2022 00:59:52 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180628T000000, start_date=20221111T005951, end_date=20221111T005953 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:53.407064Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ffa0e99d-c039-4ed9-88a9-a0de77310839"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6af2b210 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:46.551348Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ca460c6-4579-4f2c-9654-2e4ff0ad02ee"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:46.551348+00:00, try_number=1, job_id=769, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-28 00:00:00+00:00 +INFO - Started process 6397 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-28T00:00:00+00:00', '--job-id', '769', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj6j0gys3'] +INFO - Job 769: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180628T000000, start_date=20221111T005946, end_date=20221111T005952 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:52.193022Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ca460c6-4579-4f2c-9654-2e4ff0ad02ee"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..5a7b9405 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T00:59:46.689409Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "80e535a3-7981-375d-bb44-05a74cbc344c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4bc4512a-86b0-4fc1-b983-6e5e99fc63c2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:46.689409+00:00, try_number=1, job_id=770, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-28 00:00:00+00:00 +INFO - Started process 6400 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-28T00:00:00+00:00', '--job-id', '770', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp2efj2cgr'] +INFO - Job 770: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180628T000000, start_date=20221111T005946, end_date=20221111T005949 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T00:59:49.567700Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4bc4512a-86b0-4fc1-b983-6e5e99fc63c2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0146bf6d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:59.226625Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4670b45a-b210-4e8d-9349-0c93a005d368"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:59.226625+00:00, try_number=1, job_id=773, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-29 00:00:00+00:00 +INFO - Started process 6413 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-29T00:00:00+00:00', '--job-id', '773', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo4qbaz3x'] +INFO - Job 773: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180629T000000, start_date=20221111T005959, end_date=20221111T010002 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:02.936937Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4670b45a-b210-4e8d-9349-0c93a005d368"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..75017b67 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T00:59:59.226498Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e914156d-273d-43f5-bfc2-bf4ca87ed5b4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 00:59:59.226498+00:00, try_number=1, job_id=774, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-29 00:00:00+00:00 +INFO - Started process 6415 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-29T00:00:00+00:00', '--job-id', '774', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4jgzt33i'] +INFO - Job 774: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180629T000000, start_date=20221111T005959, end_date=20221111T010003 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:03.104015Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e914156d-273d-43f5-bfc2-bf4ca87ed5b4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..a65b47e8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:19.003475Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e252e20-a243-4982-a62b-c4ade4ceda0d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:19.003475+00:00, try_number=1, job_id=778, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-29 00:00:00+00:00 +INFO - Started process 6503 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-29T00:00:00+00:00', '--job-id', '778', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp339x1s9o'] +INFO - Job 778: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ef940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'P3/XD2Zthy++pyQKyX/UBQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:P3/XD2Zthy++pyQKyX/UBQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010020Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010020Z +20221111/us-east-1/s3/aws4_request +ea5833a1b839c73528ad1b151afe78fbaf327fdee25d2e9f2a429c9d561beb5b +INFO - '2022-11-11' - botocore.auth - Signature: +2d1ff1e2f803801806675b5b188b73d9a9911793a41822ccdf67701ac6a4be92 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'puPB4cpkXSHoPORrimnmZwYhieFBtuM7uCNnys/L1EVQrKeWPAMvrsKt1oIHjsuaTTd2WH3F4cw=', 'x-amz-request-id': 'VGDRKWECM35H3HW2', 'Date': 'Fri, 11 Nov 2022 01:00:21 GMT', 'ETag': '"3f7fd70f666d872fbea7240ac97fd405"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180629T000000, start_date=20221111T010019, end_date=20221111T010022 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:22.143358Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e252e20-a243-4982-a62b-c4ade4ceda0d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..78d84953 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:12.937401Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7377f6c1-05bf-40ec-9e3e-0ed7a1041fae"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:12.937401+00:00, try_number=1, job_id=777, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-29 00:00:00+00:00 +INFO - Started process 6495 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-29T00:00:00+00:00', '--job-id', '777', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnuu_xzkn'] +INFO - Job 777: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010014Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010014Z +20221111/us-east-1/s3/aws4_request +36ffaf45575e03aa2e223f551c9c270968061a07658ccc599ce126e6e53e535d +INFO - '2022-11-11' - botocore.auth - Signature: +02761e0642f867f1dde5ca45d14ba32f56beffc97246cc6dbe40f88b8dc18490 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'sw52imTQilGk0nrMxPGrmh5mKk1WYMPMMUzQsEkgl1LyMtEiGcTtZ7RL/UuQPgopSKGJ3igH5ow=', 'x-amz-request-id': '58SJ6YENG2CMH0CF', 'Date': 'Fri, 11 Nov 2022 01:00:15 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180629T000000, start_date=20221111T010012, end_date=20221111T010016 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:16.189576Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7377f6c1-05bf-40ec-9e3e-0ed7a1041fae"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ab2f2b3a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:05.103095Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb965f4d-8a74-4bf7-86b6-4b9f60b03556"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:05.103095+00:00, try_number=1, job_id=775, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-29 00:00:00+00:00 +INFO - Started process 6487 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-29T00:00:00+00:00', '--job-id', '775', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjw21ug_w'] +INFO - Job 775: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180629T000000, start_date=20221111T010005, end_date=20221111T010016 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:16.505353Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb965f4d-8a74-4bf7-86b6-4b9f60b03556"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6d82cb90 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:05.889679Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "18a092e7-b9df-3a6c-ba58-74efe9baaaad"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "758daeae-9005-4621-bf6d-f0d5da78fd9b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:05.889679+00:00, try_number=1, job_id=776, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-29 00:00:00+00:00 +INFO - Started process 6490 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-29T00:00:00+00:00', '--job-id', '776', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplrzw76v5'] +INFO - Job 776: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180629T000000, start_date=20221111T010005, end_date=20221111T010009 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:09.340825Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "758daeae-9005-4621-bf6d-f0d5da78fd9b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..dfe67b91 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:00:25.435170Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4036c3df-988e-4df5-9d33-6be23190b518"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-06-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:25.435170+00:00, try_number=1, job_id=779, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-30 00:00:00+00:00 +INFO - Started process 6423 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-06-30T00:00:00+00:00', '--job-id', '779', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn7_4ew7n'] +INFO - Job 779: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180630T000000, start_date=20221111T010025, end_date=20221111T010029 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:29.076465Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4036c3df-988e-4df5-9d33-6be23190b518"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a015b902 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:00:25.579066Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f3c284af-10d7-48f9-bb64-9bc3be7570f6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-06-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:25.579066+00:00, try_number=1, job_id=780, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-30 00:00:00+00:00 +INFO - Started process 6425 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-06-30T00:00:00+00:00', '--job-id', '780', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp15sjswbi'] +INFO - Job 780: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180630T000000, start_date=20221111T010025, end_date=20221111T010029 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:29.257270Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f3c284af-10d7-48f9-bb64-9bc3be7570f6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1b7b4881 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:45.453506Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c389c631-fd8e-4e06-8c29-08498cd0f078"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-06-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:45.453506+00:00, try_number=1, job_id=784, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-30 00:00:00+00:00 +INFO - Started process 6474 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-06-30T00:00:00+00:00', '--job-id', '784', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpc0jrneky'] +INFO - Job 784: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'qUfyROg9sV6XZM7VzinXVA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:qUfyROg9sV6XZM7VzinXVA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010046Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010046Z +20221111/us-east-1/s3/aws4_request +5f3575116e98ae9d95a74dc963246e2812a51af801235b42e4f752ecc9d5f4b4 +INFO - '2022-11-11' - botocore.auth - Signature: +2a950b71999d99c7f8e78971c707641903e9b6c8fa005eea7ca2b21173875795 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '0gMz+g7/1lr2+EpH2+DfMGqXsC8ZSyZZfAj0N0UbTiNDPVCOgp6r5gZG8C/v6BpArJu0qfheV0I=', 'x-amz-request-id': 'WGC9GXERSH4ENB7Y', 'Date': 'Fri, 11 Nov 2022 01:00:47 GMT', 'ETag': '"a947f244e83db15e9764ced5ce29d754"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180630T000000, start_date=20221111T010045, end_date=20221111T010048 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:48.521664Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c389c631-fd8e-4e06-8c29-08498cd0f078"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..032fedcd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:39.147340Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e1efbd3e-b807-4950-aeaa-34054d14c56e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-06-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:39.147340+00:00, try_number=1, job_id=783, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-30 00:00:00+00:00 +INFO - Started process 6436 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-06-30T00:00:00+00:00', '--job-id', '783', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgbeulcib'] +INFO - Job 783: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010040Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010040Z +20221111/us-east-1/s3/aws4_request +b1ef6b9513ef171799d00bd976bd9a3ed5c3df6f5983331a7ed4c09534f56d13 +INFO - '2022-11-11' - botocore.auth - Signature: +61af0bf878ae5161e5d16ff57f809a5da1d8ee4e63175b9826ad17f02d5bc894 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'ZQalNcYhAogjde2HvFwmslVgFn2guYRYCQKvCa/fVpNvVh8gX5dCXQib4xB2Krx/TMMgSNuImxc=', 'x-amz-request-id': '02SQBSZ2SMWQK5QX', 'Date': 'Fri, 11 Nov 2022 01:00:41 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180630T000000, start_date=20221111T010039, end_date=20221111T010041 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:41.821007Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e1efbd3e-b807-4950-aeaa-34054d14c56e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..4dabc795 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:32.117893Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73c6d4f9-6ebf-4929-b184-a6626eab5059"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-06-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:32.117893+00:00, try_number=1, job_id=781, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-30 00:00:00+00:00 +INFO - Started process 6510 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-06-30T00:00:00+00:00', '--job-id', '781', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzay8g09j'] +INFO - Job 781: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180630T000000, start_date=20221111T010032, end_date=20221111T010042 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:42.378166Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73c6d4f9-6ebf-4929-b184-a6626eab5059"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..2cbd5cfb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-06-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:32.907561Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-06-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0055d521-1ec2-3d5a-8f2b-53bf7af9a787"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "75734b77-b4c7-477d-b1e9-dd6ceed687f4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-06-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:32.907561+00:00, try_number=1, job_id=782, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-06-30 00:00:00+00:00 +INFO - Started process 6431 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-06-30T00:00:00+00:00', '--job-id', '782', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj_a5cj67'] +INFO - Job 782: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-06-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180630T000000, start_date=20221111T010032, end_date=20221111T010036 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-06-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:36.514507Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "75734b77-b4c7-477d-b1e9-dd6ceed687f4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b87cc43c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:00:51.731595Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6c24ba87-78ec-4c66-b423-68d1aa359e71"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:51.731595+00:00, try_number=1, job_id=785, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-01 00:00:00+00:00 +INFO - Started process 6519 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-01T00:00:00+00:00', '--job-id', '785', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsdcbhblt'] +INFO - Job 785: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180701T000000, start_date=20221111T010051, end_date=20221111T010055 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:55.843406Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6c24ba87-78ec-4c66-b423-68d1aa359e71"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..995586e3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:00:51.688530Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "abac4b2a-3032-4080-b9f1-720a6b9abfce"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:51.688530+00:00, try_number=1, job_id=786, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-01 00:00:00+00:00 +INFO - Started process 6516 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-01T00:00:00+00:00', '--job-id', '786', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpopu87j8g'] +INFO - Job 786: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180701T000000, start_date=20221111T010051, end_date=20221111T010055 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:00:55.850863Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "abac4b2a-3032-4080-b9f1-720a6b9abfce"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..27a0c679 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:07.486702Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58bf26bb-b009-40d5-bedd-1a81a0ee372b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:07.486702+00:00, try_number=1, job_id=790, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-01 00:00:00+00:00 +INFO - Started process 6527 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-01T00:00:00+00:00', '--job-id', '790', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7r1_wqbe'] +INFO - Job 790: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'S0uEC+zKfYdOaqRPHzboFw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:S0uEC+zKfYdOaqRPHzboFw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010108Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010108Z +20221111/us-east-1/s3/aws4_request +3beddff7790cde77382c8828a77faa96c0ca7d9c88869c0b6cd482df8fb2f4a4 +INFO - '2022-11-11' - botocore.auth - Signature: +b153eead38b43f5648eb677c1496b6892be11279c8bfb3aeb4f6bcf14a45ca05 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'W+/tZ56j9a5YcZrREP04n9wlJgoLJ8de9tA8fC4TvdxyDmn/oqVhL8ooskrWLabib20pX0SI/3Y=', 'x-amz-request-id': 'VCBTRJ9XYGMCGY37', 'Date': 'Fri, 11 Nov 2022 01:01:08 GMT', 'ETag': '"4b4b840becca7d874e6aa44f1f36e817"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180701T000000, start_date=20221111T010107, end_date=20221111T010109 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:09.424813Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58bf26bb-b009-40d5-bedd-1a81a0ee372b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..38752d84 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:05.004552Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f51294ef-7b3e-46b0-b895-d319bc32f5d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:05.004552+00:00, try_number=1, job_id=789, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-01 00:00:00+00:00 +INFO - Started process 6520 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-01T00:00:00+00:00', '--job-id', '789', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0u5t70ei'] +INFO - Job 789: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010106Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010106Z +20221111/us-east-1/s3/aws4_request +81945800fa7b5d8c4f11bde3f0a181f3c9ac96b9659441861900842ca0719a96 +INFO - '2022-11-11' - botocore.auth - Signature: +4ba97ba279cde22fdfade61a30fdf00d74b427a84a9108b5042bb61a33f51dfe +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'X3D1rbsTiKB/gFBf8mHDGFqVZCdzrM1KpICNxcHKqPuxZvXj96vGctloozmZr7r5QDT69LeD+OY=', 'x-amz-request-id': 'WACDW4Z3BDX1G154', 'Date': 'Fri, 11 Nov 2022 01:01:06 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180701T000000, start_date=20221111T010105, end_date=20221111T010107 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:07.592269Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f51294ef-7b3e-46b0-b895-d319bc32f5d6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..3ae0dd9b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:58.374235Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "50ad62c7-9de5-4ce4-bbb3-27b7a7fc4201"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:58.374235+00:00, try_number=1, job_id=787, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-01 00:00:00+00:00 +INFO - Started process 6529 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-01T00:00:00+00:00', '--job-id', '787', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp5x00qd7'] +INFO - Job 787: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180701T000000, start_date=20221111T010058, end_date=20221111T010105 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:05.559790Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "50ad62c7-9de5-4ce4-bbb3-27b7a7fc4201"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..74859018 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:00:58.425013Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0452f127-df8e-3c5f-978b-26db83699f63"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc23e659-6878-4675-9738-e46e8876e9e8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:00:58.425013+00:00, try_number=1, job_id=788, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-01 00:00:00+00:00 +INFO - Started process 6528 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-01T00:00:00+00:00', '--job-id', '788', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_3f9737l'] +INFO - Job 788: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180701T000000, start_date=20221111T010058, end_date=20221111T010102 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:02.075834Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc23e659-6878-4675-9738-e46e8876e9e8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..cfd04e14 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:01:11.787240Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d65d070-a101-4971-846f-ff707a758958"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:11.787240+00:00, try_number=1, job_id=791, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-02 00:00:00+00:00 +INFO - Started process 6537 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-02T00:00:00+00:00', '--job-id', '791', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgodb126w'] +INFO - Job 791: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180702T000000, start_date=20221111T010111, end_date=20221111T010116 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:16.232980Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d65d070-a101-4971-846f-ff707a758958"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..9b39632a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:01:11.816689Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a8d69c64-5931-4906-88b3-f26d3382af87"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:11.816689+00:00, try_number=1, job_id=792, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-02 00:00:00+00:00 +INFO - Started process 6538 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-02T00:00:00+00:00', '--job-id', '792', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp33i9hiqk'] +INFO - Job 792: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180702T000000, start_date=20221111T010111, end_date=20221111T010116 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:16.139274Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a8d69c64-5931-4906-88b3-f26d3382af87"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..64fe2fd8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:27.405666Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bdc74dc2-fa34-4427-8a02-3946c92ef457"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:27.405666+00:00, try_number=1, job_id=796, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-02 00:00:00+00:00 +INFO - Started process 6610 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-02T00:00:00+00:00', '--job-id', '796', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_r5z_me3'] +INFO - Job 796: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'HeOOW7K4nPRpAiP2uACbfQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:HeOOW7K4nPRpAiP2uACbfQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010128Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010128Z +20221111/us-east-1/s3/aws4_request +343e3de141cfa594c5cb20fe13fb294c948f5b12b38e3ca836971c1d2600a20b +INFO - '2022-11-11' - botocore.auth - Signature: +e0597de2fae911e1dfeec39a44eff7d39af39cb0b497f46bc5c777e0061c6f82 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'HzHAyWar7FaR6s6DaYQ0Sue0fOlIpdRFkGhjthA6VROj6IP2iQYSTfy0AZsyWXBq8B/qepVuXuQ=', 'x-amz-request-id': 'TZXXFHYYD9NW2V6M', 'Date': 'Fri, 11 Nov 2022 01:01:28 GMT', 'ETag': '"1de38e5bb2b89cf4690223f6b8009b7d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180702T000000, start_date=20221111T010127, end_date=20221111T010129 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:29.478296Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bdc74dc2-fa34-4427-8a02-3946c92ef457"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..d7fff5fd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:25.348113Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "40d8797d-f024-4728-bb02-8849505ee165"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:25.348113+00:00, try_number=1, job_id=795, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-02 00:00:00+00:00 +INFO - Started process 6544 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-02T00:00:00+00:00', '--job-id', '795', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6xa4m88e'] +INFO - Job 795: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010126Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010126Z +20221111/us-east-1/s3/aws4_request +adb3a95b6c552e683321ddc722fe1ea2f2c64ac9186223f78ae3ae4169480e3a +INFO - '2022-11-11' - botocore.auth - Signature: +0003ed90a5163d5bfa45e5d4bd79515ed09490868a1038dac02b54044ba0ed5c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'KZNLJ9stn3NvS9lYmHd71aFdnCLGcnMH+HEFKAHpP0fWprGctmonmbyqmE5NeQJc4orDr1yBt2E=', 'x-amz-request-id': '2887Z01A9PCD7Z41', 'Date': 'Fri, 11 Nov 2022 01:01:27 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180702T000000, start_date=20221111T010125, end_date=20221111T010127 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:27.974080Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "40d8797d-f024-4728-bb02-8849505ee165"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..ac9e564a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:18.722503Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "10024b41-597e-4931-80cc-1a79f50bc1b9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:18.722503+00:00, try_number=1, job_id=793, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-02 00:00:00+00:00 +INFO - Started process 6601 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-02T00:00:00+00:00', '--job-id', '793', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbrxdgvcv'] +INFO - Job 793: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180702T000000, start_date=20221111T010118, end_date=20221111T010125 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:25.632078Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "10024b41-597e-4931-80cc-1a79f50bc1b9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..491750b9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:19.119905Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "58855754-fde6-3824-8d02-28eeff4e792f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a24932b-0517-461b-bb5f-ecd1511a2ef0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:19.119905+00:00, try_number=1, job_id=794, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-02 00:00:00+00:00 +INFO - Started process 6604 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-02T00:00:00+00:00', '--job-id', '794', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpysiu61lb'] +INFO - Job 794: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180702T000000, start_date=20221111T010119, end_date=20221111T010122 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:22.424493Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a24932b-0517-461b-bb5f-ecd1511a2ef0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..433bc31f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:01:31.962436Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ecb0ec6b-8a20-4752-97f1-46c4c92ade5b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:31.962436+00:00, try_number=1, job_id=797, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-03 00:00:00+00:00 +INFO - Started process 6552 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-03T00:00:00+00:00', '--job-id', '797', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzg6la78r'] +INFO - Job 797: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180703T000000, start_date=20221111T010131, end_date=20221111T010135 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:35.555178Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ecb0ec6b-8a20-4752-97f1-46c4c92ade5b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..81ad6cb6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:01:32.041249Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e5a0c7d-bd17-42fb-875a-28931d3823b5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:32.041249+00:00, try_number=1, job_id=798, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-03 00:00:00+00:00 +INFO - Started process 6555 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-03T00:00:00+00:00', '--job-id', '798', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcqgk36o5'] +INFO - Job 798: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180703T000000, start_date=20221111T010132, end_date=20221111T010135 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:35.518294Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e5a0c7d-bd17-42fb-875a-28931d3823b5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c525e530 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:42.835783Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "256acd88-bd5c-4a4b-906c-94d90f80ec38"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:42.835783+00:00, try_number=1, job_id=802, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-03 00:00:00+00:00 +INFO - Started process 6617 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-03T00:00:00+00:00', '--job-id', '802', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6rq03nzv'] +INFO - Job 802: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'HeOOW7K4nPRpAiP2uACbfQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:HeOOW7K4nPRpAiP2uACbfQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010143Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010143Z +20221111/us-east-1/s3/aws4_request +faecab2164264500f34a8484d41c85f1bb636882932ca3b8c2af3d5d83d29175 +INFO - '2022-11-11' - botocore.auth - Signature: +9b85b80fad2ac0531b1c307f8fbef19b8a65fa4f5bf130ada162fee1bf577602 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'AbrURGXkqq1tR1JYTMlfIu7Mk+IwoaUGjd15VuYBPc1oJsb08u33NJcG6UlaMuctuSQ3G+WY1aA=', 'x-amz-request-id': '87QYTK7YC473S34T', 'Date': 'Fri, 11 Nov 2022 01:01:44 GMT', 'ETag': '"1de38e5bb2b89cf4690223f6b8009b7d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180703T000000, start_date=20221111T010142, end_date=20221111T010144 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:44.710930Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "256acd88-bd5c-4a4b-906c-94d90f80ec38"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..240f1bba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:41.585857Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "66551dcd-71c2-42bc-ab3d-8e8237406f65"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:41.585857+00:00, try_number=1, job_id=801, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-03 00:00:00+00:00 +INFO - Started process 6636 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-03T00:00:00+00:00', '--job-id', '801', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6b2praf2'] +INFO - Job 801: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010142Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010142Z +20221111/us-east-1/s3/aws4_request +666db416688c3a50f6ef46962cd81d3463ce5880fa3aacf71a335edeaa17f08c +INFO - '2022-11-11' - botocore.auth - Signature: +c8874993596f75f20726ef4f1dfaf82245175919f60bc71c4e24e8bb2ed85530 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'c11kq3xK1HvUpk4KM62KUjR9UQeFur1iy70d1r//q+T+Pv9maNa6jm9JE2EznTs/vaWsN622/yQ=', 'x-amz-request-id': 'TAN5QRXFV94QQWD8', 'Date': 'Fri, 11 Nov 2022 01:01:42 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180703T000000, start_date=20221111T010141, end_date=20221111T010143 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:43.464475Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "66551dcd-71c2-42bc-ab3d-8e8237406f65"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..7803ca2c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:37.145673Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e65129b5-4ce5-4a5a-a6ad-966233859833"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:37.145673+00:00, try_number=1, job_id=800, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-03 00:00:00+00:00 +INFO - Started process 6630 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-03T00:00:00+00:00', '--job-id', '800', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfwincetb'] +INFO - Job 800: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180703T000000, start_date=20221111T010137, end_date=20221111T010141 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:41.522869Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e65129b5-4ce5-4a5a-a6ad-966233859833"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..e2948b82 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:37.052133Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "180349ef-e57f-36c3-8991-06a0439d4d32"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "54874422-55cf-47d5-a555-51557efb42a9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:37.052133+00:00, try_number=1, job_id=799, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-03 00:00:00+00:00 +INFO - Started process 6628 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-03T00:00:00+00:00', '--job-id', '799', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpstbvj1l3'] +INFO - Job 799: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180703T000000, start_date=20221111T010137, end_date=20221111T010139 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:39.993376Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "54874422-55cf-47d5-a555-51557efb42a9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..6998b044 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:01:46.779114Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "887f808e-77dc-43f3-b1ad-d4037c99528d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:46.779114+00:00, try_number=1, job_id=804, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-04 00:00:00+00:00 +INFO - Started process 6641 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-04T00:00:00+00:00', '--job-id', '804', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8ttc0qzc'] +INFO - Job 804: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180704T000000, start_date=20221111T010146, end_date=20221111T010150 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:50.378970Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "887f808e-77dc-43f3-b1ad-d4037c99528d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..318e00b9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:01:46.778717Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd332bf7-e532-491f-8142-6e97955fae64"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:46.778717+00:00, try_number=1, job_id=803, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-04 00:00:00+00:00 +INFO - Started process 6638 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-04T00:00:00+00:00', '--job-id', '803', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfshduzvz'] +INFO - Job 803: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180704T000000, start_date=20221111T010146, end_date=20221111T010150 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:50.387189Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cd332bf7-e532-491f-8142-6e97955fae64"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..8d225b18 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:59.647500Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed6dd7a5-17db-477f-bea0-ce8b56dd4a43"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:59.647500+00:00, try_number=1, job_id=808, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-04 00:00:00+00:00 +INFO - Started process 6699 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-04T00:00:00+00:00', '--job-id', '808', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi09mqt6h'] +INFO - Job 808: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'HeOOW7K4nPRpAiP2uACbfQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:HeOOW7K4nPRpAiP2uACbfQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010200Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010200Z +20221111/us-east-1/s3/aws4_request +f649fd7463ddd54064a91db7163dcfebf5b924fa9dda04bc82c2ee3f0e7973f8 +INFO - '2022-11-11' - botocore.auth - Signature: +58576ccbbdf47a52a34d781e2c362db2ad01fae0a0c9f157f7e4b1577b5b6df8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'YVEu/ibUIEP0/fYqjyaI8CprIXbBNh5nFV21sA7q3VJNBuDFdGEBudYSWmSD2ZKkEi/jkvf5zDM=', 'x-amz-request-id': 'G9Q9VRVC3Z3TNRHJ', 'Date': 'Fri, 11 Nov 2022 01:02:00 GMT', 'ETag': '"1de38e5bb2b89cf4690223f6b8009b7d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180704T000000, start_date=20221111T010159, end_date=20221111T010201 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:01.476580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed6dd7a5-17db-477f-bea0-ce8b56dd4a43"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..04960fe8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:57.753876Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0a20b7d6-edbb-4394-93fc-ffefcc70ca71"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:57.753876+00:00, try_number=1, job_id=807, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-04 00:00:00+00:00 +INFO - Started process 6652 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-04T00:00:00+00:00', '--job-id', '807', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxobck4zf'] +INFO - Job 807: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010158Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010158Z +20221111/us-east-1/s3/aws4_request +939c8d1fc0c9d14b507e4c3b9518ad98a9644dfac5f0a60b41d119e1f2fdfe6a +INFO - '2022-11-11' - botocore.auth - Signature: +6f318b1f71acee5b91426931d5d9d7c529e8ff0a45baa324d28f7af2c697348d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'csXIR9BETqj1kdPkFgTxiMiD81NkroOjMUWyggtiISfugRMAoDZKarMw3takPVZEy8TfbENkNi0=', 'x-amz-request-id': '27Y8PX3140NECTP1', 'Date': 'Fri, 11 Nov 2022 01:01:59 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180704T000000, start_date=20221111T010157, end_date=20221111T010159 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:59.993383Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0a20b7d6-edbb-4394-93fc-ffefcc70ca71"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e2655e00 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:53.278682Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "97121802-c1a4-48c3-ab9f-90cb19f92850"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:53.278682+00:00, try_number=1, job_id=805, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-04 00:00:00+00:00 +INFO - Started process 6646 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-04T00:00:00+00:00', '--job-id', '805', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptyi_3as5'] +INFO - Job 805: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180704T000000, start_date=20221111T010153, end_date=20221111T010158 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:58.142937Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "97121802-c1a4-48c3-ab9f-90cb19f92850"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..1f4ca80e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:01:53.349154Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d9c8aa35-f2e0-35a7-b424-15b6c07399e3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dd1c1644-4763-4f97-b455-ca3a27e497b8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:01:53.349154+00:00, try_number=1, job_id=806, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-04 00:00:00+00:00 +INFO - Started process 6647 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-04T00:00:00+00:00', '--job-id', '806', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp12n_n_0y'] +INFO - Job 806: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180704T000000, start_date=20221111T010153, end_date=20221111T010156 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:01:56.267608Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dd1c1644-4763-4f97-b455-ca3a27e497b8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..912c4baa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:02:03.594817Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c7c980d-e40a-43ee-9fb3-06677f3031a4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:03.594817+00:00, try_number=1, job_id=809, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-05 00:00:00+00:00 +INFO - Started process 6664 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-05T00:00:00+00:00', '--job-id', '809', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9twn8ee9'] +INFO - Job 809: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180705T000000, start_date=20221111T010203, end_date=20221111T010206 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:06.908235Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3c7c980d-e40a-43ee-9fb3-06677f3031a4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..abde1c0a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:02:03.591254Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a18b399b-4ed4-4bbd-bab3-fa74d0b98a98"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:03.591254+00:00, try_number=1, job_id=810, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-05 00:00:00+00:00 +INFO - Started process 6662 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-05T00:00:00+00:00', '--job-id', '810', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmh047g11'] +INFO - Job 810: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180705T000000, start_date=20221111T010203, end_date=20221111T010206 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:06.882109Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a18b399b-4ed4-4bbd-bab3-fa74d0b98a98"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..ec5edb75 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:19.226904Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93634eec-08c5-4e94-9362-2df6788f4b03"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:19.226904+00:00, try_number=1, job_id=814, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-05 00:00:00+00:00 +INFO - Started process 6735 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-05T00:00:00+00:00', '--job-id', '814', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcjcelwk1'] +INFO - Job 814: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'nYTV6KbUOclosMEHLSRxbQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:nYTV6KbUOclosMEHLSRxbQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010220Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010220Z +20221111/us-east-1/s3/aws4_request +ace02413d27c09b83b66c637828578ee3974fc5e280e71d56f720e2ed41a415b +INFO - '2022-11-11' - botocore.auth - Signature: +b790ebed750fc372346282acdd39009131d0f10451a20852cd1442bb1626d1bd +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'e1AbtiTRMGiku/JrFfO/awgxD0SycyqN9W7NhG15JKNdmGznSpRnpY1MeSH9Yh2vUWW0NY4qJVE=', 'x-amz-request-id': 'HQQ9Z5122S1JX95C', 'Date': 'Fri, 11 Nov 2022 01:02:21 GMT', 'ETag': '"9d84d5e8a6d439c968b0c1072d24716d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180705T000000, start_date=20221111T010219, end_date=20221111T010222 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:22.023556Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93634eec-08c5-4e94-9362-2df6788f4b03"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..ce4b5617 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:16.224393Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39ffc9b3-d710-4343-8922-1487a9ee0e88"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:16.224393+00:00, try_number=1, job_id=813, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-05 00:00:00+00:00 +INFO - Started process 6716 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-05T00:00:00+00:00', '--job-id', '813', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwf5ecy8q'] +INFO - Job 813: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa3940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010217Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010217Z +20221111/us-east-1/s3/aws4_request +b11c7206d9b4a4b3c32a2c8b4c5cd5e397904dbc54f62871e2efb876d2166d06 +INFO - '2022-11-11' - botocore.auth - Signature: +04d30a69d75e5811c0e7d53a6f43f73b6c38adf0ac0ab26ddf97ceed19babdf0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'VqGtfGXdPjXwbik2POb8NbMTezvMGLv8S84vlRWbbMksXCQLtPWupPxgN1Bg+aszp4AmpThTABg=', 'x-amz-request-id': '0Z38EBC823D365CB', 'Date': 'Fri, 11 Nov 2022 01:02:18 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180705T000000, start_date=20221111T010216, end_date=20221111T010219 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:19.005692Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39ffc9b3-d710-4343-8922-1487a9ee0e88"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..eddeb9a6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:09.117047Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ac4a7892-dcd3-4982-be5d-690035b6705b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:09.117047+00:00, try_number=1, job_id=811, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-05 00:00:00+00:00 +INFO - Started process 6710 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-05T00:00:00+00:00', '--job-id', '811', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp5ofkmkx'] +INFO - Job 811: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180705T000000, start_date=20221111T010209, end_date=20221111T010215 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:15.962400Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ac4a7892-dcd3-4982-be5d-690035b6705b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..7f7b3751 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:09.139910Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d4f4e7f8-97d5-3bce-80fc-99d15b8befb9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27188236-baee-41e6-9456-b9c642cee0e9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:09.139910+00:00, try_number=1, job_id=812, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-05 00:00:00+00:00 +INFO - Started process 6709 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-05T00:00:00+00:00', '--job-id', '812', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpb2nplmc6'] +INFO - Job 812: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180705T000000, start_date=20221111T010209, end_date=20221111T010213 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:13.031682Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27188236-baee-41e6-9456-b9c642cee0e9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..96e5a4bf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:02:24.745450Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "09215177-ae04-4e0f-abbc-92ce96825530"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:24.745450+00:00, try_number=1, job_id=816, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-06 00:00:00+00:00 +INFO - Started process 6792 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-06T00:00:00+00:00', '--job-id', '816', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjcp00bf6'] +INFO - Job 816: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180706T000000, start_date=20221111T010224, end_date=20221111T010229 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:29.261921Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "09215177-ae04-4e0f-abbc-92ce96825530"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..46131771 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:02:24.703552Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d71d080b-e8d8-4df6-8f60-1d3236b05711"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:24.703552+00:00, try_number=1, job_id=815, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-06 00:00:00+00:00 +INFO - Started process 6790 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-06T00:00:00+00:00', '--job-id', '815', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoqrt3i8i'] +INFO - Job 815: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180706T000000, start_date=20221111T010224, end_date=20221111T010229 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:29.256765Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d71d080b-e8d8-4df6-8f60-1d3236b05711"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..b8b86d5e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:37.149954Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0af51ad9-1143-4466-8325-99d1939db436"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:37.149954+00:00, try_number=1, job_id=820, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-06 00:00:00+00:00 +INFO - Started process 6773 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-06T00:00:00+00:00', '--job-id', '820', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpne2_xtlq'] +INFO - Job 820: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'nYTV6KbUOclosMEHLSRxbQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:nYTV6KbUOclosMEHLSRxbQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010238Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010238Z +20221111/us-east-1/s3/aws4_request +0a933753f549f299d7f77b6c8a34367438bd38893e18dd2bde49d21d2446542f +INFO - '2022-11-11' - botocore.auth - Signature: +ee8514c8a75e2a43b56edc5d9d5b5a6710110810055b3d1beef5be3e9f5379de +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '+FTAsuRAuGpfl0FpO78mMA5vXbxWHK7C8EABxDHR0LcD8VLuJ1q/fwaw2vs6w3dX99rkgSgoocQ=', 'x-amz-request-id': '1C2WNWXD4GD4WR64', 'Date': 'Fri, 11 Nov 2022 01:02:38 GMT', 'ETag': '"9d84d5e8a6d439c968b0c1072d24716d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180706T000000, start_date=20221111T010237, end_date=20221111T010239 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:39.320864Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0af51ad9-1143-4466-8325-99d1939db436"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a52692cb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:35.799221Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db3f66d3-e196-4081-b71e-c80c5b41460b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:35.799221+00:00, try_number=1, job_id=819, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-06 00:00:00+00:00 +INFO - Started process 6808 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-06T00:00:00+00:00', '--job-id', '819', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3rn1p35p'] +INFO - Job 819: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010236Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010236Z +20221111/us-east-1/s3/aws4_request +774fda26e5692f935ac35d31f4c459c168e4c10ebcedc1175e8a249c493fd4f8 +INFO - '2022-11-11' - botocore.auth - Signature: +63872f48a6ecabc510a46b1190b3ca54cec04ae5982f92804111619ef0899916 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'FyLezvQwNadnihE15J6GLLPZtaX1m7rfg4KPHBO7gghHSdKLGCNYsJCVToOTrfAaQBgBGR6A56I=', 'x-amz-request-id': 'CPBN66ZF0G98ZE99', 'Date': 'Fri, 11 Nov 2022 01:02:37 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180706T000000, start_date=20221111T010235, end_date=20221111T010238 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:38.189464Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db3f66d3-e196-4081-b71e-c80c5b41460b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8cd1a982 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:30.887930Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c83b09ee-9661-4b65-8f54-d5a0d4ca6d6f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:30.887930+00:00, try_number=1, job_id=817, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-06 00:00:00+00:00 +INFO - Started process 6800 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-06T00:00:00+00:00', '--job-id', '817', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbx521gn7'] +INFO - Job 817: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180706T000000, start_date=20221111T010230, end_date=20221111T010235 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:35.357370Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c83b09ee-9661-4b65-8f54-d5a0d4ca6d6f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..db3806bb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:30.897628Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1a3a5e87-0511-339c-846a-00a09c8be1cb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1d856f80-3940-42fb-92eb-36034b58cb27"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:30.897628+00:00, try_number=1, job_id=818, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-06 00:00:00+00:00 +INFO - Started process 6802 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-06T00:00:00+00:00', '--job-id', '818', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpiujrj4md'] +INFO - Job 818: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180706T000000, start_date=20221111T010230, end_date=20221111T010234 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:34.382442Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1d856f80-3940-42fb-92eb-36034b58cb27"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..20a43c04 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:02:42.574592Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e72d1a15-5b90-45f6-85ca-e33e1aee7528"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:42.574592+00:00, try_number=1, job_id=822, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-07 00:00:00+00:00 +INFO - Started process 6818 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-07T00:00:00+00:00', '--job-id', '822', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpceb4heoi'] +INFO - Job 822: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180707T000000, start_date=20221111T010242, end_date=20221111T010245 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:45.994332Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e72d1a15-5b90-45f6-85ca-e33e1aee7528"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..50298d62 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:02:42.529733Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f58a6b4-3f55-42dd-adfe-56274add3edd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:42.529733+00:00, try_number=1, job_id=821, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-07 00:00:00+00:00 +INFO - Started process 6817 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-07T00:00:00+00:00', '--job-id', '821', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8349h0hj'] +INFO - Job 821: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180707T000000, start_date=20221111T010242, end_date=20221111T010246 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:46.008118Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f58a6b4-3f55-42dd-adfe-56274add3edd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e05985d8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:57.833950Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d806de2-af6b-454e-be0e-dcd2c3b41a17"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:57.833950+00:00, try_number=1, job_id=826, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-07 00:00:00+00:00 +INFO - Started process 6880 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-07T00:00:00+00:00', '--job-id', '826', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0et7yk46'] +INFO - Job 826: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'ujcCHEOMh61kohN1/pnBPg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:ujcCHEOMh61kohN1/pnBPg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010258Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010258Z +20221111/us-east-1/s3/aws4_request +5db3d823037354f8c20325a8e8cd7a369ac99d4d77b1c1988fa629e5ec70f8ea +INFO - '2022-11-11' - botocore.auth - Signature: +f646e3411f79ab448b01af41744aa1ad02df4a7c798f291681b70978eea27ab8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'kiKhyID3iuCaHIcZV/OMYIiwtJmv/g6ARSD7mYtPRspLEkCbOrKkwGQbFNxpEc/B8+TfoRFU+GQ=', 'x-amz-request-id': 'YHJB89F2FV36PGB6', 'Date': 'Fri, 11 Nov 2022 01:02:59 GMT', 'ETag': '"ba37021c438c87ad64a21375fe99c13e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180707T000000, start_date=20221111T010257, end_date=20221111T010259 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:59.739573Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d806de2-af6b-454e-be0e-dcd2c3b41a17"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..0c6a3b18 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:54.273284Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a2746997-a34e-4e24-937d-068f0e838fe9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:54.273284+00:00, try_number=1, job_id=825, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-07 00:00:00+00:00 +INFO - Started process 6833 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-07T00:00:00+00:00', '--job-id', '825', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6fuupwsb'] +INFO - Job 825: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010255Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010255Z +20221111/us-east-1/s3/aws4_request +c3c8b5922a0f081858dbd2e77b26a234d27b4a71927647384387e8adf7b933f4 +INFO - '2022-11-11' - botocore.auth - Signature: +afeafdcce8d2d1407aae4742f78e8b02edb9afb7aae564e9474590d84c3593fc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'nulvbayRwKpxdl0p57ZfkIBueYSLeVffwBQss6kRo9+N1yFVwxbck2irKDcLltpBR6z4XlFlE+I=', 'x-amz-request-id': 'FD6HQFM8BWBD2W04', 'Date': 'Fri, 11 Nov 2022 01:02:56 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180707T000000, start_date=20221111T010254, end_date=20221111T010256 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:56.774192Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a2746997-a34e-4e24-937d-068f0e838fe9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..62711265 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:48.152468Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d93956fa-e3f2-4742-92bf-29921a2c4d2f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:48.152468+00:00, try_number=1, job_id=824, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-07 00:00:00+00:00 +INFO - Started process 6828 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-07T00:00:00+00:00', '--job-id', '824', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpunda7ewj'] +INFO - Job 824: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180707T000000, start_date=20221111T010248, end_date=20221111T010255 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:55.994987Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d93956fa-e3f2-4742-92bf-29921a2c4d2f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a0f405e6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:02:48.087085Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "423de294-e807-3d75-9356-f3481059d94b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "170587a5-f25f-4f2b-92ee-8cd99dfefa26"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:02:48.087085+00:00, try_number=1, job_id=823, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-07 00:00:00+00:00 +INFO - Started process 6826 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-07T00:00:00+00:00', '--job-id', '823', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgygl8ndo'] +INFO - Job 823: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180707T000000, start_date=20221111T010248, end_date=20221111T010251 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:02:51.660728Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "170587a5-f25f-4f2b-92ee-8cd99dfefa26"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..32444f3b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:03.008142Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41898ed0-6773-41c7-9df8-c4f0c3bffe90"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:03.008142+00:00, try_number=1, job_id=827, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-08 00:00:00+00:00 +INFO - Started process 6890 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-08T00:00:00+00:00', '--job-id', '827', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp59rv2hwh'] +INFO - Job 827: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180708T000000, start_date=20221111T010303, end_date=20221111T010306 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:06.498604Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41898ed0-6773-41c7-9df8-c4f0c3bffe90"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..be4c1cfa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:03.006331Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a17e0c86-4eb3-41dd-bd50-d175fcaa4521"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:03.006331+00:00, try_number=1, job_id=828, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-08 00:00:00+00:00 +INFO - Started process 6891 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-08T00:00:00+00:00', '--job-id', '828', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprr5o67jy'] +INFO - Job 828: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180708T000000, start_date=20221111T010303, end_date=20221111T010306 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:06.496732Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a17e0c86-4eb3-41dd-bd50-d175fcaa4521"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e0f02eac --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:19.047316Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a1aab48-b042-4424-bb49-b6b84d60ec2e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:19.047316+00:00, try_number=1, job_id=832, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-08 00:00:00+00:00 +INFO - Started process 6925 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-08T00:00:00+00:00', '--job-id', '832', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6p3l6tcs'] +INFO - Job 832: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'VyNz4KbxuMPyter+vPTjuA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:VyNz4KbxuMPyter+vPTjuA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010320Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010320Z +20221111/us-east-1/s3/aws4_request +3a193d2878174f592c719376671d175dad5638f9886d5985e5ef4322022fd29d +INFO - '2022-11-11' - botocore.auth - Signature: +1d9f439cc948ad02de6a5d0a27ec4e63f6ce10910bcb7163d9b8d5acd92fd4a5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'H4CjWg1Rw4bHPQIxkN5sYRLakwR1codjWnWefECYqPeCQZogb2Ksq7RND0xIePzLieJU6uZIxyA=', 'x-amz-request-id': '2BD5MBN3ENKXGB6F', 'Date': 'Fri, 11 Nov 2022 01:03:21 GMT', 'ETag': '"572373e0a6f1b8c3f2b5eafebcf4e3b8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180708T000000, start_date=20221111T010319, end_date=20221111T010322 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:22.467130Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a1aab48-b042-4424-bb49-b6b84d60ec2e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..2a457d05 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:14.313622Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c17ffb34-240e-454d-b5e8-a63acc56c2ea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:14.313622+00:00, try_number=1, job_id=831, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-08 00:00:00+00:00 +INFO - Started process 6906 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-08T00:00:00+00:00', '--job-id', '831', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppk2n21_r'] +INFO - Job 831: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010315Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010315Z +20221111/us-east-1/s3/aws4_request +026b232e8b9fdb8abc7d432ebf0a8a6c58bbca7ec428ae5b712bb28cb81840c4 +INFO - '2022-11-11' - botocore.auth - Signature: +0b29ec926c3fc4d588e2779ac49008bdb1766282b4cc067e244df16b668d3141 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mybfzsUw5narciPlOExjVAqEUbQvBtly7Lop5/dnhyRhX3vrEEusrhdLev+4+DG9k634WJiOvboK/U88B2mP6A==', 'x-amz-request-id': 'J40KVSAJA0AHANKY', 'Date': 'Fri, 11 Nov 2022 01:03:16 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180708T000000, start_date=20221111T010314, end_date=20221111T010316 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:16.929246Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c17ffb34-240e-454d-b5e8-a63acc56c2ea"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..0c689464 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:08.814838Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57669881-897e-4f5d-8f4b-440f10178a90"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:08.814838+00:00, try_number=1, job_id=830, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-08 00:00:00+00:00 +INFO - Started process 6901 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-08T00:00:00+00:00', '--job-id', '830', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgh3mvcf6'] +INFO - Job 830: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180708T000000, start_date=20221111T010308, end_date=20221111T010316 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:16.307981Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57669881-897e-4f5d-8f4b-440f10178a90"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..d13e483f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:08.651778Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf786979-b160-3ca1-8e71-ba9bc03febeb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46bb3f55-6d96-48a3-a824-55bea52ea559"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:08.651778+00:00, try_number=1, job_id=829, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-08 00:00:00+00:00 +INFO - Started process 6899 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-08T00:00:00+00:00', '--job-id', '829', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6co1lavd'] +INFO - Job 829: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180708T000000, start_date=20221111T010308, end_date=20221111T010312 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:12.388294Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "46bb3f55-6d96-48a3-a824-55bea52ea559"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..24d66912 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:25.125930Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "42458fe0-0b87-403d-9506-47463f71b157"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:25.125930+00:00, try_number=1, job_id=834, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-09 00:00:00+00:00 +INFO - Started process 6983 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-09T00:00:00+00:00', '--job-id', '834', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxq3z_6wq'] +INFO - Job 834: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180709T000000, start_date=20221111T010325, end_date=20221111T010328 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:28.247534Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "42458fe0-0b87-403d-9506-47463f71b157"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..203ee982 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:25.085314Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7eac93e0-7154-4c7f-8ac6-b928d56141f3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:25.085314+00:00, try_number=1, job_id=833, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-09 00:00:00+00:00 +INFO - Started process 6981 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-09T00:00:00+00:00', '--job-id', '833', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpiw__te03'] +INFO - Job 833: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180709T000000, start_date=20221111T010325, end_date=20221111T010328 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:28.238938Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7eac93e0-7154-4c7f-8ac6-b928d56141f3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..653b3d2d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:34.824476Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8465273-b1ef-42f0-ad65-62ade4786118"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:34.824476+00:00, try_number=1, job_id=838, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-09 00:00:00+00:00 +INFO - Started process 6991 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-09T00:00:00+00:00', '--job-id', '838', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn0hf39rz'] +INFO - Job 838: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'VyNz4KbxuMPyter+vPTjuA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:VyNz4KbxuMPyter+vPTjuA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010335Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010335Z +20221111/us-east-1/s3/aws4_request +36923b3f7d66e2be0cd95c53518cdc8aa44cb9e2f77355948d7f2d217787e066 +INFO - '2022-11-11' - botocore.auth - Signature: +9ccd429f5ddb725e234ba2fc292e142f211d4616f792d29c88cfa9578ff1e97d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '73k+5SvYUF1X2OITdI3zxerXpuXRUC0Ugdf6reW0JHig/xamx/CaaOro1KaRT4YbYxr+IDuT12M=', 'x-amz-request-id': 'D95ZV0HBVZFS11SB', 'Date': 'Fri, 11 Nov 2022 01:03:36 GMT', 'ETag': '"572373e0a6f1b8c3f2b5eafebcf4e3b8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180709T000000, start_date=20221111T010334, end_date=20221111T010336 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:36.866867Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8465273-b1ef-42f0-ad65-62ade4786118"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..61cfcb13 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:34.824512Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e143d773-0f18-4e3f-9c7d-0b8e801c2f30"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:34.824512+00:00, try_number=1, job_id=837, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-09 00:00:00+00:00 +INFO - Started process 6993 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-09T00:00:00+00:00', '--job-id', '837', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0pz39u0j'] +INFO - Job 837: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010335Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010335Z +20221111/us-east-1/s3/aws4_request +9df2596072c1f48ee68ece38507725b9719ccf5bd0fb2286e8210045d4c260a8 +INFO - '2022-11-11' - botocore.auth - Signature: +b8d472f2aaf3b1423ad4c2a9eb2e40f68f3760ac2968518e493be955ae4cbc26 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'nJk4NcsWK1xjIsTsOIdQ4hAJ8Scv9RiiKIlRSv2kbuJcdkrGDYdreM1gRjtF68c3fURshL3VO3g=', 'x-amz-request-id': 'D95PW6MPQ8C9S0ZF', 'Date': 'Fri, 11 Nov 2022 01:03:36 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180709T000000, start_date=20221111T010334, end_date=20221111T010337 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:37.354810Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e143d773-0f18-4e3f-9c7d-0b8e801c2f30"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..061ffcac --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:29.866418Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "003d822f-276f-46ff-b2d4-75257cacceb7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:29.866418+00:00, try_number=1, job_id=836, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-09 00:00:00+00:00 +INFO - Started process 6917 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-09T00:00:00+00:00', '--job-id', '836', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3xzbvxyg'] +INFO - Job 836: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180709T000000, start_date=20221111T010329, end_date=20221111T010333 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:33.616887Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "003d822f-276f-46ff-b2d4-75257cacceb7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..5451b30f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:29.868653Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "959bf271-e1de-3328-9e05-a8b08fed3daa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb41be94-0681-429f-aa3a-573fa580c428"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:29.868653+00:00, try_number=1, job_id=835, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-09 00:00:00+00:00 +INFO - Started process 6916 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-09T00:00:00+00:00', '--job-id', '835', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6gxpcc3_'] +INFO - Job 835: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180709T000000, start_date=20221111T010329, end_date=20221111T010333 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:33.038051Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb41be94-0681-429f-aa3a-573fa580c428"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..72f04b09 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:40.002326Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee9ec08b-b533-4c97-8fa4-7d0a44b22c41"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:40.002326+00:00, try_number=1, job_id=839, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-10 00:00:00+00:00 +INFO - Started process 7005 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-10T00:00:00+00:00', '--job-id', '839', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5s75qrvo'] +INFO - Job 839: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180710T000000, start_date=20221111T010340, end_date=20221111T010344 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:44.927185Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ee9ec08b-b533-4c97-8fa4-7d0a44b22c41"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..feaf35be --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:40.009661Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4e5555e2-1280-4609-8653-a56ce1b4f9a4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:40.009661+00:00, try_number=1, job_id=840, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-10 00:00:00+00:00 +INFO - Started process 7007 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-10T00:00:00+00:00', '--job-id', '840', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdfq9xwrx'] +INFO - Job 840: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180710T000000, start_date=20221111T010340, end_date=20221111T010343 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:43.087658Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4e5555e2-1280-4609-8653-a56ce1b4f9a4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..52ddcf25 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:54.916090Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "428992da-fdda-436d-ba9a-ebaaeefd1886"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:54.916090+00:00, try_number=1, job_id=844, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-10 00:00:00+00:00 +INFO - Started process 7086 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-10T00:00:00+00:00', '--job-id', '844', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpji9dzvzy'] +INFO - Job 844: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'V2yRLBqLoM2VEiAYT4msng==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:V2yRLBqLoM2VEiAYT4msng== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010355Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010355Z +20221111/us-east-1/s3/aws4_request +f8315c22f96b035ee56ff4b531128941faf1687056a0bdc65d84ce7fd4243866 +INFO - '2022-11-11' - botocore.auth - Signature: +544d2d58cfc3c5bc4a6218cb524cdb8c096a8c8d16d54f8f3e641dbb7fc1b335 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'ygQzFQdyIqUr8L5kI+r3l/hU/x4Ng8YN3YXD+Rz3TeLcY7A/zMGPy/lOnp8IHFfEOkyje25FiWU=', 'x-amz-request-id': 'KS8C873EC8F1EJS3', 'Date': 'Fri, 11 Nov 2022 01:03:56 GMT', 'ETag': '"576c912c1a8ba0cd951220184f89ac9e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180710T000000, start_date=20221111T010354, end_date=20221111T010357 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:57.121075Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "428992da-fdda-436d-ba9a-ebaaeefd1886"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..dd3fc37e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:48.611214Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a059197-1939-455c-9339-851cebfc26d5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:48.611214+00:00, try_number=1, job_id=843, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-10 00:00:00+00:00 +INFO - Started process 6988 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-10T00:00:00+00:00', '--job-id', '843', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxc73f505'] +INFO - Job 843: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010349Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010349Z +20221111/us-east-1/s3/aws4_request +3618e92e94408af40f0f7edfb27ad8d0fe107920e0c90b9cbb3a16f015ecbd1d +INFO - '2022-11-11' - botocore.auth - Signature: +99bb396445c895f9f01d0249f72f152a2a4d536bc889b2dad17337206d7b381f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'QIvtUxKde9fcgzYQcsLtUr6iV7foSoJpv0GQP1scHQjVLy0lvsybFKQdghuzS/xqG506XmX6mv0=', 'x-amz-request-id': 'G8YHYMFPQFD4E8HM', 'Date': 'Fri, 11 Nov 2022 01:03:50 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180710T000000, start_date=20221111T010348, end_date=20221111T010351 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:51.109253Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a059197-1939-455c-9339-851cebfc26d5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d4eaca3e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:46.904267Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aebffd13-6721-4505-9de7-3813ffc0102b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:46.904267+00:00, try_number=1, job_id=842, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-10 00:00:00+00:00 +INFO - Started process 7018 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-10T00:00:00+00:00', '--job-id', '842', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprdewwe2d'] +INFO - Job 842: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180710T000000, start_date=20221111T010346, end_date=20221111T010352 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:52.762467Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aebffd13-6721-4505-9de7-3813ffc0102b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..8730e89c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:03:44.092414Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51fedc30-8d56-3d94-b849-554bc74ff7e7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5919f1e1-a837-44ef-b558-b8d3620002c3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:44.092414+00:00, try_number=1, job_id=841, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-10 00:00:00+00:00 +INFO - Started process 7012 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-10T00:00:00+00:00', '--job-id', '841', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcvzm4y3u'] +INFO - Job 841: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180710T000000, start_date=20221111T010344, end_date=20221111T010346 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:03:46.303770Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5919f1e1-a837-44ef-b558-b8d3620002c3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f19b0e0e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:59.686034Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ceaafd1-3d5d-4911-b281-4772c1beb652"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:59.686034+00:00, try_number=1, job_id=845, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-11 00:00:00+00:00 +INFO - Started process 7097 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-11T00:00:00+00:00', '--job-id', '845', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_1d55x3g'] +INFO - Job 845: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180711T000000, start_date=20221111T010359, end_date=20221111T010403 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:03.409520Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ceaafd1-3d5d-4911-b281-4772c1beb652"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b78fdf51 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:03:59.733686Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b3e6f275-5003-411b-9b10-5385486dbe1e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:03:59.733686+00:00, try_number=1, job_id=846, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-11 00:00:00+00:00 +INFO - Started process 7099 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-11T00:00:00+00:00', '--job-id', '846', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprhg0acd_'] +INFO - Job 846: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180711T000000, start_date=20221111T010359, end_date=20221111T010403 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:03.412698Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b3e6f275-5003-411b-9b10-5385486dbe1e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..90ea7279 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:12.571158Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1776c872-1564-4ad8-aa78-e850ca9b0c41"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:12.571158+00:00, try_number=1, job_id=850, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-11 00:00:00+00:00 +INFO - Started process 7054 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-11T00:00:00+00:00', '--job-id', '850', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzs1pxfh5'] +INFO - Job 850: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498ee940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'P+aYLupIhoimtmQxWJsWFw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:P+aYLupIhoimtmQxWJsWFw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010413Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010413Z +20221111/us-east-1/s3/aws4_request +ad1da5251f592f3cfda93faf82114a765418c3b03a831f3f908fd8473a4d3987 +INFO - '2022-11-11' - botocore.auth - Signature: +a45e92ca957ca641ebcf5ea7a777959c3985b173e301721fe165aef5a67637c7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'kr1OWvYQraQzGc8HpW+VUCYvZvM+KqSXpbobphvZizwnMECxMYRdt/9FGe/zwE3f4efeQZOiWVQ=', 'x-amz-request-id': 'VVA2AW02GK70CK82', 'Date': 'Fri, 11 Nov 2022 01:04:13 GMT', 'ETag': '"3fe6982eea488688a6b66431589b1617"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180711T000000, start_date=20221111T010412, end_date=20221111T010414 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:14.497622Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1776c872-1564-4ad8-aa78-e850ca9b0c41"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..de000f43 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:11.961927Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "72c80670-8004-4b9a-b218-20437463186e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:11.961927+00:00, try_number=1, job_id=849, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-11 00:00:00+00:00 +INFO - Started process 7049 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-11T00:00:00+00:00', '--job-id', '849', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl47e9x4_'] +INFO - Job 849: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010412Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010412Z +20221111/us-east-1/s3/aws4_request +34f67818fe7f4658b6654060390e80a7946f40681f42e7731273504cdf5d861f +INFO - '2022-11-11' - botocore.auth - Signature: +8a2547e78faae3afac8261154c8c4c93dd45460bb37202676d33d8abe6bca6e3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UsBvJCGvcCgUGVkpAkvEoFQtPsn/ODF52BLoHxc7MbqCXgoGtGJphP/eHfklHyRcNyznxbwkRkc=', 'x-amz-request-id': 'VVA3C6C5R0MPDVQ2', 'Date': 'Fri, 11 Nov 2022 01:04:13 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180711T000000, start_date=20221111T010411, end_date=20221111T010414 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:14.238824Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "72c80670-8004-4b9a-b218-20437463186e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..f4d37374 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:05.096783Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6edf86c6-4867-47a1-bb8c-144a4fc64c65"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:05.096783+00:00, try_number=1, job_id=847, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-11 00:00:00+00:00 +INFO - Started process 7108 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-11T00:00:00+00:00', '--job-id', '847', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps_in5cju'] +INFO - Job 847: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180711T000000, start_date=20221111T010405, end_date=20221111T010410 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:10.408681Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6edf86c6-4867-47a1-bb8c-144a4fc64c65"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6a6a0dc3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:05.094517Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d0bd09bc-f96f-37b3-b51a-c262a3651cab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fae805d8-b73f-4a95-b8d9-e65c0682eae5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:05.094517+00:00, try_number=1, job_id=848, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-11 00:00:00+00:00 +INFO - Started process 7109 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-11T00:00:00+00:00', '--job-id', '848', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp553jgzgr'] +INFO - Job 848: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180711T000000, start_date=20221111T010405, end_date=20221111T010409 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:09.236471Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fae805d8-b73f-4a95-b8d9-e65c0682eae5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..558115bd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:04:16.970821Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8dcc6c7f-9143-47da-88d4-57d9851eb0e1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:16.970821+00:00, try_number=1, job_id=852, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-12 00:00:00+00:00 +INFO - Started process 7078 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-12T00:00:00+00:00', '--job-id', '852', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp00eng0dn'] +INFO - Job 852: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180712T000000, start_date=20221111T010416, end_date=20221111T010420 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:20.489748Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8dcc6c7f-9143-47da-88d4-57d9851eb0e1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b03c6e7e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:04:16.883233Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7820a774-40dd-4681-ad5a-87bd2b97dbb0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:16.883233+00:00, try_number=1, job_id=851, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-12 00:00:00+00:00 +INFO - Started process 7076 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-12T00:00:00+00:00', '--job-id', '851', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg91kynch'] +INFO - Job 851: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180712T000000, start_date=20221111T010416, end_date=20221111T010420 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:20.489745Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7820a774-40dd-4681-ad5a-87bd2b97dbb0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5dd35366 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:32.186186Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd54cb80-d322-445e-b943-ac37b007eb96"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:32.186186+00:00, try_number=1, job_id=856, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-12 00:00:00+00:00 +INFO - Started process 7180 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-12T00:00:00+00:00', '--job-id', '856', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq8f8uv8s'] +INFO - Job 856: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JBkZN3Ewdl/O2FU5PQ2QIQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:JBkZN3Ewdl/O2FU5PQ2QIQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010433Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010433Z +20221111/us-east-1/s3/aws4_request +3f8fc914eb0b664b9fd27dc9394000d132b12d68aa3c886576495a7f57fabafb +INFO - '2022-11-11' - botocore.auth - Signature: +504f6f98ce7f17f894fe9df403f2ce0237598e4c06ea15c40f2d44224e0100c2 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'fkFuieWmgQvE1Z+2zdJ3YymX/VQxYESy+HU+v/yTJERQkvOmMfePUpmXZyqhaw4m8xoIlHVS8CU=', 'x-amz-request-id': 'WCADX27JAJ7A18PK', 'Date': 'Fri, 11 Nov 2022 01:04:33 GMT', 'ETag': '"241919377130765fced855393d0d9021"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180712T000000, start_date=20221111T010432, end_date=20221111T010434 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:34.604324Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd54cb80-d322-445e-b943-ac37b007eb96"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1e92d5e0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:28.298215Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bfeb8f72-e42c-476b-b7e6-ae115cb2cd16"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:28.298215+00:00, try_number=1, job_id=855, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-12 00:00:00+00:00 +INFO - Started process 7093 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-12T00:00:00+00:00', '--job-id', '855', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpojyg9bpu'] +INFO - Job 855: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499531f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010429Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010429Z +20221111/us-east-1/s3/aws4_request +6788f9a5fc788ba5757744966309cee271b4d56d780fac64e4779c09bfb15d6b +INFO - '2022-11-11' - botocore.auth - Signature: +373e82e0ab59d5800741e1624ea805252d2b22a8a119b9a7e8a4d3a5825b0ec7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'eICoBsHVZN2hDHvBgwkdWjvTw4QpVcCPwT/ZVQcA/1oiIG6pdYNAm7oxlimvjcR+0EUEAR2zZHA=', 'x-amz-request-id': 'G8300BNMDDVAK5ZT', 'Date': 'Fri, 11 Nov 2022 01:04:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180712T000000, start_date=20221111T010428, end_date=20221111T010430 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:30.484065Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bfeb8f72-e42c-476b-b7e6-ae115cb2cd16"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..3ecc1785 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:22.282226Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6009d478-d867-4033-b866-2e7d34f0a04c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:22.282226+00:00, try_number=1, job_id=853, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-12 00:00:00+00:00 +INFO - Started process 7085 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-12T00:00:00+00:00', '--job-id', '853', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprnk5c9_d'] +INFO - Job 853: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180712T000000, start_date=20221111T010422, end_date=20221111T010430 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:30.513274Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6009d478-d867-4033-b866-2e7d34f0a04c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..6d2c2f4b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:22.305372Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e399aa79-d9bd-3a2c-9f15-49184fcc6de7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27fcfc30-272f-4b9c-bb24-53c8d1f9f5df"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:22.305372+00:00, try_number=1, job_id=854, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-12 00:00:00+00:00 +INFO - Started process 7088 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-12T00:00:00+00:00', '--job-id', '854', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4xbz_lxo'] +INFO - Job 854: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180712T000000, start_date=20221111T010422, end_date=20221111T010425 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:25.873737Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27fcfc30-272f-4b9c-bb24-53c8d1f9f5df"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..56ee03aa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:04:36.970729Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4163db06-f51d-4d2d-b62d-7725a8a8a60d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:36.970729+00:00, try_number=1, job_id=858, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-13 00:00:00+00:00 +INFO - Started process 7104 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-13T00:00:00+00:00', '--job-id', '858', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplkd5b0kz'] +INFO - Job 858: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180713T000000, start_date=20221111T010436, end_date=20221111T010439 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:39.931179Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4163db06-f51d-4d2d-b62d-7725a8a8a60d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..e67a4d87 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:04:36.970244Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "321b0f61-242f-453d-809b-8bd932fb2c7e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:36.970244+00:00, try_number=1, job_id=857, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-13 00:00:00+00:00 +INFO - Started process 7105 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-13T00:00:00+00:00', '--job-id', '857', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt2t3i_mg'] +INFO - Job 857: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180713T000000, start_date=20221111T010436, end_date=20221111T010439 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:39.935820Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "321b0f61-242f-453d-809b-8bd932fb2c7e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1499606d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:47.934371Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65e1e606-d295-4fef-8f89-de6029f5bbf2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:47.934371+00:00, try_number=1, job_id=862, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-13 00:00:00+00:00 +INFO - Started process 7203 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-13T00:00:00+00:00', '--job-id', '862', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp95pccub'] +INFO - Job 862: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'fGQUEIsJHW1oRihrrEBSKQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:fGQUEIsJHW1oRihrrEBSKQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010448Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010448Z +20221111/us-east-1/s3/aws4_request +62e18620e319c7f120b437dada4fb69c794b75165070651bd080db82d6d7612f +INFO - '2022-11-11' - botocore.auth - Signature: +7b2d9127a50c80668d06eb3831d16a48d9ef3b6f2e98ddd58be4997d6a88b0d2 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'R7S90gl4Gy7/KwVM/wZXoCGQy3WSR5hKHe5WplXPk+rHg9QTNbssWUISEZCwHH/b0YdozNxU3wY=', 'x-amz-request-id': 'XZMSJ4N576XCS1KQ', 'Date': 'Fri, 11 Nov 2022 01:04:49 GMT', 'ETag': '"7c6414108b091d6d6846286bac405229"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180713T000000, start_date=20221111T010447, end_date=20221111T010449 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:49.604332Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "65e1e606-d295-4fef-8f89-de6029f5bbf2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..dc984353 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:46.684236Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ac5490f-b763-4b69-88db-0b766942eb43"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:46.684236+00:00, try_number=1, job_id=861, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-13 00:00:00+00:00 +INFO - Started process 7197 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-13T00:00:00+00:00', '--job-id', '861', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpu8z_tnzx'] +INFO - Job 861: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010447Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010447Z +20221111/us-east-1/s3/aws4_request +9f4a8a51c90dcf6ebeeb7dc3468339886c10d3578d6b1ba327f76c3d33d2f905 +INFO - '2022-11-11' - botocore.auth - Signature: +01a2eddcead411c8fba5c7986c3a2913f7b3393fd039391a3cc85b828d6e2ed0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'vS/NLKToS3lIiL+joNSIfkf2bfIqX0PaCTvB3lITxCJXnxJJlcSfKD9TiRR4oi56rQi/bGV6K+A=', 'x-amz-request-id': '4HXTG4BKMVAWS9D1', 'Date': 'Fri, 11 Nov 2022 01:04:48 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180713T000000, start_date=20221111T010446, end_date=20221111T010448 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:48.676299Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ac5490f-b763-4b69-88db-0b766942eb43"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..0eea526e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:42.023717Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bbb68ee2-1d87-4780-8750-f650e2a06467"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:42.023717+00:00, try_number=1, job_id=859, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-13 00:00:00+00:00 +INFO - Started process 7191 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-13T00:00:00+00:00', '--job-id', '859', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9hinhokm'] +INFO - Job 859: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180713T000000, start_date=20221111T010442, end_date=20221111T010446 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:46.766163Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bbb68ee2-1d87-4780-8750-f650e2a06467"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..913af114 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:42.021485Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f4af663-756a-36a0-b9aa-db8f32b26b3d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7ed9f99-cdbb-4802-97c2-2e4ca7beb546"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:42.021485+00:00, try_number=1, job_id=860, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-13 00:00:00+00:00 +INFO - Started process 7188 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-13T00:00:00+00:00', '--job-id', '860', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe2v3af02'] +INFO - Job 860: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180713T000000, start_date=20221111T010442, end_date=20221111T010445 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:45.153837Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7ed9f99-cdbb-4802-97c2-2e4ca7beb546"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..12cc7e29 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:04:51.771147Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d11ffe01-5bed-4cc1-9866-5cb689ccd601"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:51.771147+00:00, try_number=1, job_id=864, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-14 00:00:00+00:00 +INFO - Started process 7233 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-14T00:00:00+00:00', '--job-id', '864', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1ll4hanf'] +INFO - Job 864: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180714T000000, start_date=20221111T010451, end_date=20221111T010455 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:55.318959Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d11ffe01-5bed-4cc1-9866-5cb689ccd601"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6aec5587 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:04:51.599965Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8cd755dc-3c98-4bf6-8f68-86ab51fec91e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:51.599965+00:00, try_number=1, job_id=863, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-14 00:00:00+00:00 +INFO - Started process 7230 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-14T00:00:00+00:00', '--job-id', '863', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpe1v1dq83'] +INFO - Job 863: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180714T000000, start_date=20221111T010451, end_date=20221111T010455 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:04:55.534403Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8cd755dc-3c98-4bf6-8f68-86ab51fec91e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1d1e2a74 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:08.694498Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92b1f750-1673-4ee7-b5be-ab600dfb1640"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:08.694498+00:00, try_number=1, job_id=868, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-14 00:00:00+00:00 +INFO - Started process 7176 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-14T00:00:00+00:00', '--job-id', '868', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0hcy3igw'] +INFO - Job 868: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Kl1ZUhBUKNIPqAY2idTN2A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Kl1ZUhBUKNIPqAY2idTN2A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010509Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010509Z +20221111/us-east-1/s3/aws4_request +a57186b455bd2b074f6314053d3a2709fde6fa1043a3f5e185d2e5539708b085 +INFO - '2022-11-11' - botocore.auth - Signature: +65cc5d16b405e7c13b1041d4e3e70063f455dbdcd1a4665be35f001fe9f0ce05 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'QHa6pyk97RkNOSY2Xlbc2QC5NxLQpRkMVPbKhgQiVneAKS4OEUKWDxfHpJV2pZoU79fLKqKAIOw=', 'x-amz-request-id': 'JP6EJCKTJTPKSKR6', 'Date': 'Fri, 11 Nov 2022 01:05:10 GMT', 'ETag': '"2a5d5952105428d20fa8063689d4cdd8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180714T000000, start_date=20221111T010508, end_date=20221111T010511 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:11.413152Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92b1f750-1673-4ee7-b5be-ab600dfb1640"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..a33b36b0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:02.713475Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ca5214a-786f-4926-8c57-36a4e6d537a0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:02.713475+00:00, try_number=1, job_id=867, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-14 00:00:00+00:00 +INFO - Started process 7265 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-14T00:00:00+00:00', '--job-id', '867', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphumrjqq0'] +INFO - Job 867: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010504Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010504Z +20221111/us-east-1/s3/aws4_request +4db8ed930d24bdde9cc5af10cebdaa105eb7a847a861413ced0e7d49da734e7b +INFO - '2022-11-11' - botocore.auth - Signature: +b0ec207491f7c8bf6537a304d7244d5e04383522837b1d139b06e00053679aca +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'VTljgOvRMWCUFwsbVKI0tyb6vJxjIOwXVmoDLeDskxTIX644ZZxdL98j4XdbnJG98lrhvAvg5uY=', 'x-amz-request-id': 'T1XH1VEVGPGSMR0A', 'Date': 'Fri, 11 Nov 2022 01:05:04 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180714T000000, start_date=20221111T010502, end_date=20221111T010505 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:05.483486Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7ca5214a-786f-4926-8c57-36a4e6d537a0"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..93372d41 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:57.403411Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea7433f1-b875-4d3f-a925-362788fc0378"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:57.403411+00:00, try_number=1, job_id=866, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-14 00:00:00+00:00 +INFO - Started process 7260 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-14T00:00:00+00:00', '--job-id', '866', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprtimz36f'] +INFO - Job 866: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180714T000000, start_date=20221111T010457, end_date=20221111T010505 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:05.922975Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea7433f1-b875-4d3f-a925-362788fc0378"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..ea253fa5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:04:56.935494Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0aa4b54e-fabe-3a57-9c45-dffb7bb1dc9d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6234de63-f031-4e87-8a0d-1a3f04a29450"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:04:56.935494+00:00, try_number=1, job_id=865, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-14 00:00:00+00:00 +INFO - Started process 7257 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-14T00:00:00+00:00', '--job-id', '865', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpprulpwmr'] +INFO - Job 865: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180714T000000, start_date=20221111T010456, end_date=20221111T010500 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:00.247925Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6234de63-f031-4e87-8a0d-1a3f04a29450"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..bd8d225b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:05:14.132723Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab2d2b33-f7bc-4c54-9eca-9f17092a3a88"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:14.132723+00:00, try_number=1, job_id=869, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-15 00:00:00+00:00 +INFO - Started process 7236 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-15T00:00:00+00:00', '--job-id', '869', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf_h8zles'] +INFO - Job 869: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180715T000000, start_date=20221111T010514, end_date=20221111T010517 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:17.599015Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab2d2b33-f7bc-4c54-9eca-9f17092a3a88"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..6b2f3dfd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:05:14.137357Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "13280e4a-6fcd-408a-901d-09dbf8ed9d1e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:14.137357+00:00, try_number=1, job_id=870, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-15 00:00:00+00:00 +INFO - Started process 7237 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-15T00:00:00+00:00', '--job-id', '870', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpnn77e73_'] +INFO - Job 870: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180715T000000, start_date=20221111T010514, end_date=20221111T010517 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:17.596603Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "13280e4a-6fcd-408a-901d-09dbf8ed9d1e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..eae34e5e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:33.408685Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27348b74-f818-4e65-9075-a1435f26ac4d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:33.408685+00:00, try_number=1, job_id=874, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-15 00:00:00+00:00 +INFO - Started process 7290 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-15T00:00:00+00:00', '--job-id', '874', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyh0613a6'] +INFO - Job 874: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'tQlmTHg81Ktd22wQWPuq4g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:tQlmTHg81Ktd22wQWPuq4g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010534Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010534Z +20221111/us-east-1/s3/aws4_request +4f9d0f24d817a45e99e189b7b4314b82c7aab1eb1589ee4783cdd25da7144206 +INFO - '2022-11-11' - botocore.auth - Signature: +636712f04b9deaf7a267e8988cda900a77f2137f596a29da66ad4f4341cf8e9e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '26nwmB55cAzlPHKjFRtngby9UoO+ckvVoPQr3zFot2QbCElj6sQG1jiOPZXI/Okdh0YvHbVUpa0=', 'x-amz-request-id': 'WD7D3BF13002RHTC', 'Date': 'Fri, 11 Nov 2022 01:05:34 GMT', 'ETag': '"b509664c783cd4ab5ddb6c1058fbaae2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180715T000000, start_date=20221111T010533, end_date=20221111T010535 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:35.662815Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27348b74-f818-4e65-9075-a1435f26ac4d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..72f72fd9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:27.154197Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92b6693a-7d26-4a93-a12c-e6bb9ffb0ec4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:27.154197+00:00, try_number=1, job_id=873, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-15 00:00:00+00:00 +INFO - Started process 7282 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-15T00:00:00+00:00', '--job-id', '873', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3m9otkvl'] +INFO - Job 873: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010528Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010528Z +20221111/us-east-1/s3/aws4_request +2481e02a92143b6196ec4279ef77b1c3b4980d11bdd17e081273f3739e4b4a78 +INFO - '2022-11-11' - botocore.auth - Signature: +902e3d90f135bb1f06ad0305460831c28705373ce79addb854c9a38254203883 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'vRRARnxQz3R6lYA1J54I0MYyl/odQNOIY/t8Yr0IvOj/om6H8q9lZaPK7jnaKBQeW/LN4Vkag/8=', 'x-amz-request-id': '2DZQPFW1RY13EC3S', 'Date': 'Fri, 11 Nov 2022 01:05:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180715T000000, start_date=20221111T010527, end_date=20221111T010530 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:30.560836Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "92b6693a-7d26-4a93-a12c-e6bb9ffb0ec4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..71c66b3a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:20.669658Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27a4da25-5a41-4c4b-8d8b-047500bab9fe"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:20.669658+00:00, try_number=1, job_id=871, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-15 00:00:00+00:00 +INFO - Started process 7276 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-15T00:00:00+00:00', '--job-id', '871', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxmelal_n'] +INFO - Job 871: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180715T000000, start_date=20221111T010520, end_date=20221111T010531 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:31.418728Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "27a4da25-5a41-4c4b-8d8b-047500bab9fe"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a2482288 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:20.680491Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "1be4882a-31d6-35f4-9b9c-8958053986a8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "523575a9-5737-4835-b84b-2a2df36463c1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:20.680491+00:00, try_number=1, job_id=872, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-15 00:00:00+00:00 +INFO - Started process 7277 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-15T00:00:00+00:00', '--job-id', '872', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvc55nx8g'] +INFO - Job 872: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180715T000000, start_date=20221111T010520, end_date=20221111T010524 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:24.418894Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "523575a9-5737-4835-b84b-2a2df36463c1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..4d8c8381 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:05:39.028243Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "03170541-d0e0-4211-9119-577aba119ca8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:39.028243+00:00, try_number=1, job_id=876, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-16 00:00:00+00:00 +INFO - Started process 7262 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-16T00:00:00+00:00', '--job-id', '876', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4s7g2q3s'] +INFO - Job 876: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180716T000000, start_date=20221111T010539, end_date=20221111T010542 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:42.669258Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "03170541-d0e0-4211-9119-577aba119ca8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..7da47eb5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:05:38.364290Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "90fc5322-dc39-492b-9dfd-59df103e74a5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:38.364290+00:00, try_number=1, job_id=875, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-16 00:00:00+00:00 +INFO - Started process 7259 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-16T00:00:00+00:00', '--job-id', '875', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjb2jlkp5'] +INFO - Job 875: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180716T000000, start_date=20221111T010538, end_date=20221111T010542 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:42.630367Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "90fc5322-dc39-492b-9dfd-59df103e74a5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..53ee8ee6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:57.467978Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "300a8d7b-783d-4bae-9d8f-fefa5947743d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:57.467978+00:00, try_number=1, job_id=880, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-16 00:00:00+00:00 +INFO - Started process 7343 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-16T00:00:00+00:00', '--job-id', '880', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo4jnu1kn'] +INFO - Job 880: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'mPt6BoprFQoKViPsEuW0iQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:mPt6BoprFQoKViPsEuW0iQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010558Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010558Z +20221111/us-east-1/s3/aws4_request +809c28a3a207bbd2bd1081853bb148d4564e0ce0b9152f5c42e5d2f564738f80 +INFO - '2022-11-11' - botocore.auth - Signature: +df6aa87081a6d84ed747f736cfeb84cc60a73764acd43b3885dd9ae2faaa3bab +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jWwTislrVeZuwHB4OToPmXVWsWTlWODo4vbtJERa6BLgvK3TFJRJ6EzUY5OqsSVAYBYGSFiUjl4=', 'x-amz-request-id': 'D55VKRHQNFFPNCKW', 'Date': 'Fri, 11 Nov 2022 01:05:58 GMT', 'ETag': '"98fb7a068a6b150a0a5623ec12e5b489"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180716T000000, start_date=20221111T010557, end_date=20221111T010559 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:59.579355Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "300a8d7b-783d-4bae-9d8f-fefa5947743d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..2d23de54 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:53.670930Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22c977e6-3a88-42f7-a35b-73c955da7442"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:53.670930+00:00, try_number=1, job_id=879, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-16 00:00:00+00:00 +INFO - Started process 7362 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-16T00:00:00+00:00', '--job-id', '879', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmparsezqxc'] +INFO - Job 879: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50061f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010554Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010554Z +20221111/us-east-1/s3/aws4_request +47e8dff900bbb1b8c266fa1f52bc61978f5968b74de7860461bb009aa82f6448 +INFO - '2022-11-11' - botocore.auth - Signature: +8ff01dbfea392b1ef87b4fcb4e7e81b90b9864d59e5f7fba9f5ed87cc3268564 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'L+0gYrOMNT+tR+ISM8FHuq+XVni2vqp8uIJJrx109NMCYMyB9Lsa8J0MxSEWBYC7LrD4aAzmy10=', 'x-amz-request-id': 'NSX0NXGZAZDWSVA5', 'Date': 'Fri, 11 Nov 2022 01:05:55 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180716T000000, start_date=20221111T010553, end_date=20221111T010556 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:56.328794Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22c977e6-3a88-42f7-a35b-73c955da7442"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..520001c4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:46.819307Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "97857c18-2b93-4fe8-b49c-d96c42f681fc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:46.819307+00:00, try_number=1, job_id=877, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-16 00:00:00+00:00 +INFO - Started process 7333 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-16T00:00:00+00:00', '--job-id', '877', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0uuxhpjg'] +INFO - Job 877: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180716T000000, start_date=20221111T010546, end_date=20221111T010555 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:55.698525Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "97857c18-2b93-4fe8-b49c-d96c42f681fc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..950c1a3a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:05:46.880158Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ce0876db-2cd9-3ae5-84cb-f0f6e0243cfa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73344a65-c5f7-425b-b69e-69dbaedb1432"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:05:46.880158+00:00, try_number=1, job_id=878, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-16 00:00:00+00:00 +INFO - Started process 7335 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-16T00:00:00+00:00', '--job-id', '878', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0o4sp0pg'] +INFO - Job 878: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180716T000000, start_date=20221111T010546, end_date=20221111T010550 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:05:50.325269Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "73344a65-c5f7-425b-b69e-69dbaedb1432"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..40bfcbec --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:01.903797Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "94c2bfb8-04cd-491e-87dd-a3e0d2c8868e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:01.903797+00:00, try_number=1, job_id=881, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-17 00:00:00+00:00 +INFO - Started process 7351 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-17T00:00:00+00:00', '--job-id', '881', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppv8sfuou'] +INFO - Job 881: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180717T000000, start_date=20221111T010601, end_date=20221111T010605 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:05.454177Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "94c2bfb8-04cd-491e-87dd-a3e0d2c8868e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..bfa1649c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:01.973361Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4979b6a9-213b-4cfd-bd91-239b64775410"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:01.973361+00:00, try_number=1, job_id=882, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-17 00:00:00+00:00 +INFO - Started process 7354 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-17T00:00:00+00:00', '--job-id', '882', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphxa3qede'] +INFO - Job 882: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180717T000000, start_date=20221111T010601, end_date=20221111T010605 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:05.447426Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4979b6a9-213b-4cfd-bd91-239b64775410"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..0a6d4f6a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:17.254556Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e346251-4e54-48a0-837a-e65e040b6398"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:17.254556+00:00, try_number=1, job_id=886, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-17 00:00:00+00:00 +INFO - Started process 7377 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-17T00:00:00+00:00', '--job-id', '886', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt5h2xedw'] +INFO - Job 886: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'AGl41POaq4lYXPswO8OH4A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:AGl41POaq4lYXPswO8OH4A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010618Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010618Z +20221111/us-east-1/s3/aws4_request +a3c29f1f2262a053b23bbfd73101311727c6b65966892f5edc32f3072ff16194 +INFO - '2022-11-11' - botocore.auth - Signature: +d2b2f1540d7f3f0d96c2f7ed790b775ad38e0b1ecd4ca6f4ed03e8bb8f646558 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'VHpEWJQGNzDM343KDdP9yybGJ9H2AixnIRrAGvStMUg6X4dkWMekEOzBfVSqCZ54VL+fS6Pp+eE=', 'x-amz-request-id': 'GDNNJ7TJCA3XE7E7', 'Date': 'Fri, 11 Nov 2022 01:06:18 GMT', 'ETag': '"006978d4f39aab89585cfb303bc387e0"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180717T000000, start_date=20221111T010617, end_date=20221111T010619 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:19.471051Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2e346251-4e54-48a0-837a-e65e040b6398"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9a89e342 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:13.558588Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7241b15a-82fa-4bb1-8004-670f11e36f02"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:13.558588+00:00, try_number=1, job_id=885, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-17 00:00:00+00:00 +INFO - Started process 7369 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-17T00:00:00+00:00', '--job-id', '885', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0auui4vh'] +INFO - Job 885: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499543a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010614Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010614Z +20221111/us-east-1/s3/aws4_request +af956230424fc8e8f85b75afb10028b9df11f63eb209ad1bd35b2df8c452ff65 +INFO - '2022-11-11' - botocore.auth - Signature: +a603664f16bc745e1582ca4bb4cb9a76de4e8543879a0654d5584464856237aa +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'b5ayWfgdTONjoJC4bzY7orc34YYhMkRPBTjvCmc/A3sfDlpAtYcxBKbbL82bb8CskoMyLoGsmbw=', 'x-amz-request-id': '6V0WSHJ3XFMZT2W4', 'Date': 'Fri, 11 Nov 2022 01:06:15 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180717T000000, start_date=20221111T010613, end_date=20221111T010616 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:16.145337Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7241b15a-82fa-4bb1-8004-670f11e36f02"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..800e71e7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:07.453373Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2fffee47-0a43-44ac-a17d-eeed4087e132"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:07.453373+00:00, try_number=1, job_id=883, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-17 00:00:00+00:00 +INFO - Started process 7361 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-17T00:00:00+00:00', '--job-id', '883', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcarh34e1'] +INFO - Job 883: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180717T000000, start_date=20221111T010607, end_date=20221111T010615 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:15.149697Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2fffee47-0a43-44ac-a17d-eeed4087e132"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..08768505 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:07.928820Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a8e6be02-f599-3f25-889d-036cb10b481c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "61b0053f-9d5e-4b15-abed-09d18e3b8f6d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:07.928820+00:00, try_number=1, job_id=884, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-17 00:00:00+00:00 +INFO - Started process 7364 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-17T00:00:00+00:00', '--job-id', '884', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvcu86gqv'] +INFO - Job 884: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180717T000000, start_date=20221111T010607, end_date=20221111T010611 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:11.478421Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "61b0053f-9d5e-4b15-abed-09d18e3b8f6d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..1105d13f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:21.666669Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5b70b8e-bd8e-4fc0-a48c-9c89b134f9fd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:21.666669+00:00, try_number=1, job_id=888, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-18 00:00:00+00:00 +INFO - Started process 7438 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-18T00:00:00+00:00', '--job-id', '888', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcv42zqzo'] +INFO - Job 888: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180718T000000, start_date=20221111T010621, end_date=20221111T010625 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:25.231580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5b70b8e-bd8e-4fc0-a48c-9c89b134f9fd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..4f320773 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:21.587121Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "35a40f90-180a-42c7-b5cb-e7a987fa9555"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:21.587121+00:00, try_number=1, job_id=887, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-18 00:00:00+00:00 +INFO - Started process 7436 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-18T00:00:00+00:00', '--job-id', '887', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphfzf8865'] +INFO - Job 887: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180718T000000, start_date=20221111T010621, end_date=20221111T010625 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:25.144720Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "35a40f90-180a-42c7-b5cb-e7a987fa9555"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..00b2f8b7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:40.522151Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3350cf7c-3005-43c2-93a0-b140c43aca40"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:40.522151+00:00, try_number=1, job_id=892, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-18 00:00:00+00:00 +INFO - Started process 7456 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-18T00:00:00+00:00', '--job-id', '892', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoq1sgdow'] +INFO - Job 892: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'AGl41POaq4lYXPswO8OH4A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:AGl41POaq4lYXPswO8OH4A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010641Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010641Z +20221111/us-east-1/s3/aws4_request +9a61da2f79f95c3af5c5b39326e036aaa311b77a9b3479f933d5f4346d5659d7 +INFO - '2022-11-11' - botocore.auth - Signature: +9f77b0a102f5c2b9f407c7c1f30c90085556a3f9b48bcab54851efa9b1bc3286 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'U6RruDn9U77lxJyurDH1qrr2vNyFVF9KgE99LxmCT7ZoWKdpI57y+0lRZZHfhBRqsF3KcCr0rvw=', 'x-amz-request-id': '81A9TPSMRQW96953', 'Date': 'Fri, 11 Nov 2022 01:06:41 GMT', 'ETag': '"006978d4f39aab89585cfb303bc387e0"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180718T000000, start_date=20221111T010640, end_date=20221111T010642 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:42.536569Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3350cf7c-3005-43c2-93a0-b140c43aca40"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..724c8756 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:32.699871Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8caade75-1c0e-4578-bc32-723f6b8818f4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:32.699871+00:00, try_number=1, job_id=891, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-18 00:00:00+00:00 +INFO - Started process 7384 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-18T00:00:00+00:00', '--job-id', '891', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6xnz7p60'] +INFO - Job 891: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499533a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010633Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010633Z +20221111/us-east-1/s3/aws4_request +8489ef7cdcf0458654a119305867504c0a4094aa9622f66aefadb7fd4ecf34ed +INFO - '2022-11-11' - botocore.auth - Signature: +b7de21bd01528e943cc73805b562bc97545c897485cb54a647d13bc18d09737f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'g1tGcyF5quo8S1SWhQ3aVKh2wnKw7IaivcHXIveJf+RxnSiUqrTc5+B+jyfxmoGVM86X29r+A48=', 'x-amz-request-id': 'CSCERFFTVKSBEWQQ', 'Date': 'Fri, 11 Nov 2022 01:06:34 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180718T000000, start_date=20221111T010632, end_date=20221111T010634 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:34.870370Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8caade75-1c0e-4578-bc32-723f6b8818f4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e38ab34b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:27.532390Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc96376a-cf86-489a-be55-0aa118c9b508"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:27.532390+00:00, try_number=1, job_id=890, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-18 00:00:00+00:00 +INFO - Started process 7448 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-18T00:00:00+00:00', '--job-id', '890', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3tifivpl'] +INFO - Job 890: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180718T000000, start_date=20221111T010627, end_date=20221111T010638 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:38.518571Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc96376a-cf86-489a-be55-0aa118c9b508"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..39dff4b3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:27.385929Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d486e9f7-28b0-39bc-bd20-863c2de533bb"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "13ff857c-944d-48a5-9def-16bf7166fe70"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:27.385929+00:00, try_number=1, job_id=889, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-18 00:00:00+00:00 +INFO - Started process 7445 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-18T00:00:00+00:00', '--job-id', '889', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqvs2goaq'] +INFO - Job 889: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180718T000000, start_date=20221111T010627, end_date=20221111T010630 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:30.462194Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "13ff857c-944d-48a5-9def-16bf7166fe70"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f3d44938 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:44.987380Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "294a85b6-1ae3-4e64-81dd-65a55d754a6f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:44.987380+00:00, try_number=1, job_id=894, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-19 00:00:00+00:00 +INFO - Started process 7523 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-19T00:00:00+00:00', '--job-id', '894', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp93uupjol'] +INFO - Job 894: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180719T000000, start_date=20221111T010644, end_date=20221111T010648 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:48.185371Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "294a85b6-1ae3-4e64-81dd-65a55d754a6f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..c809698d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:44.907223Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a4462764-6405-4b72-aa7e-f7f28ae179f3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:44.907223+00:00, try_number=1, job_id=893, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-19 00:00:00+00:00 +INFO - Started process 7521 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-19T00:00:00+00:00', '--job-id', '893', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjp2usvt3'] +INFO - Job 893: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180719T000000, start_date=20221111T010644, end_date=20221111T010648 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:48.192520Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a4462764-6405-4b72-aa7e-f7f28ae179f3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..1ba3c0d3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:54.926371Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "08d6ecff-323b-47a9-b584-57d41b1deb3b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:54.926371+00:00, try_number=1, job_id=898, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-19 00:00:00+00:00 +INFO - Started process 7545 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-19T00:00:00+00:00', '--job-id', '898', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptbi19psb'] +INFO - Job 898: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'd3c81tEJ8IVs4EEucr9tIg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:d3c81tEJ8IVs4EEucr9tIg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010655Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010655Z +20221111/us-east-1/s3/aws4_request +e7ed8451ef0c372ffef3fc0bfd752deb4da2a514767ab5dcdcbdcee25c5c0e41 +INFO - '2022-11-11' - botocore.auth - Signature: +b3e5789111c7ed7f19d1af9bacf16967ddc877880b522b9c8fe3dedd9604b16d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Mr7arHdI27JZsxMDgQEvWQURH8WUuMQXo2c2U+rHx3I5+dvJsyE5VQh7ge1gFmgbs0dczv71jtg=', 'x-amz-request-id': '6W0SGW0QHCXRFKY7', 'Date': 'Fri, 11 Nov 2022 01:06:56 GMT', 'ETag': '"77773cd6d109f0856ce0412e72bf6d22"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180719T000000, start_date=20221111T010654, end_date=20221111T010656 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:56.648538Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "08d6ecff-323b-47a9-b584-57d41b1deb3b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..e5742d62 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:53.896787Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b4f2a4b-7dc7-4152-8ee6-9340ed539224"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:53.896787+00:00, try_number=1, job_id=897, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-19 00:00:00+00:00 +INFO - Started process 7540 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-19T00:00:00+00:00', '--job-id', '897', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9nqu4lm6'] +INFO - Job 897: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010654Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010654Z +20221111/us-east-1/s3/aws4_request +d6dadac290616671b0a3f1ac5992d838dec32983e3443c36825d45a9ac856cb2 +INFO - '2022-11-11' - botocore.auth - Signature: +6f8f87602534fc62861e34d852c577a14aed3fd5a8144e4e7f04ab7d3793414c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Svwzg57lKYYs4vlD3QpnpZgS8bICSMwLNuSMBpLr7QrPXe30ueJzxQAko8h0tyr2F6OIGGahhwc=', 'x-amz-request-id': 'FM075CVGHMZ47RQK', 'Date': 'Fri, 11 Nov 2022 01:06:55 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180719T000000, start_date=20221111T010653, end_date=20221111T010655 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:55.892405Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b4f2a4b-7dc7-4152-8ee6-9340ed539224"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..150dd879 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:49.455926Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22f121f8-c228-4a66-800a-e1287a55f92b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:49.455926+00:00, try_number=1, job_id=895, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-19 00:00:00+00:00 +INFO - Started process 7530 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-19T00:00:00+00:00', '--job-id', '895', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmplv56zrh2'] +INFO - Job 895: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180719T000000, start_date=20221111T010649, end_date=20221111T010653 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:53.656718Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22f121f8-c228-4a66-800a-e1287a55f92b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..d6cb100a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:06:49.578771Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "68b8c7a5-3189-37d3-8cd7-ee5d757af3f4"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a80fe16-4370-4e81-8a39-0622de536db3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:49.578771+00:00, try_number=1, job_id=896, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-19 00:00:00+00:00 +INFO - Started process 7533 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-19T00:00:00+00:00', '--job-id', '896', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7zp7f18z'] +INFO - Job 896: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180719T000000, start_date=20221111T010649, end_date=20221111T010652 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:06:52.419067Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a80fe16-4370-4e81-8a39-0622de536db3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..70d74ee3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:59.941867Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5df3b659-51aa-4dc8-ba53-55b3d52f68f6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:59.941867+00:00, try_number=1, job_id=899, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-20 00:00:00+00:00 +INFO - Started process 7467 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-20T00:00:00+00:00', '--job-id', '899', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_5dr5kk1'] +INFO - Job 899: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180720T000000, start_date=20221111T010659, end_date=20221111T010703 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:03.083899Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5df3b659-51aa-4dc8-ba53-55b3d52f68f6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..5e5016a5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:06:59.937603Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45c9f004-74a6-416e-83de-dc8280b5e975"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:06:59.937603+00:00, try_number=1, job_id=900, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-20 00:00:00+00:00 +INFO - Started process 7465 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-20T00:00:00+00:00', '--job-id', '900', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpauaqj2jn'] +INFO - Job 900: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180720T000000, start_date=20221111T010659, end_date=20221111T010703 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:03.162289Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45c9f004-74a6-416e-83de-dc8280b5e975"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d589d2e9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:10.648517Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f4d8cbb0-3ffd-4662-884c-3a68651bcf7b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:10.648517+00:00, try_number=1, job_id=904, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-20 00:00:00+00:00 +INFO - Started process 7578 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-20T00:00:00+00:00', '--job-id', '904', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpycngap4j'] +INFO - Job 904: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'g5L3XKG636Gw3wMt4dkhyA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:g5L3XKG636Gw3wMt4dkhyA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010711Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010711Z +20221111/us-east-1/s3/aws4_request +7b0ca4ed934ac60269cb03393e1ac2aeaadbc9886bc8deca64b44749d20e9056 +INFO - '2022-11-11' - botocore.auth - Signature: +78e9da6d97a5d9b65170b36476c1e8d7f6d088250b9dd52dd1998a887c9a60d7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'KTNwmxwm5jc4Yg1U0Nxo/PifUKFykJYmsPMthLAvEvB5zEmz7/LA/JNVovmfYRnaYjIXcyJ3SqM=', 'x-amz-request-id': 'GASBZ9RAG02P24B2', 'Date': 'Fri, 11 Nov 2022 01:07:12 GMT', 'ETag': '"8392f75ca1badfa1b0df032de1d921c8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180720T000000, start_date=20221111T010710, end_date=20221111T010713 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:13.386913Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f4d8cbb0-3ffd-4662-884c-3a68651bcf7b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4c250ad8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:10.286630Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "84e62f79-25d2-4f80-ae36-07b279cbbee6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:10.286630+00:00, try_number=1, job_id=903, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-20 00:00:00+00:00 +INFO - Started process 7519 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-20T00:00:00+00:00', '--job-id', '903', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1p7ea3qt'] +INFO - Job 903: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010711Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010711Z +20221111/us-east-1/s3/aws4_request +d9e8134016b08865a2317a96e34cdc924d256b89df7e6d65d11d0bfd4a2a2c79 +INFO - '2022-11-11' - botocore.auth - Signature: +83e7917d2166ccb1875e322afeaead720a4311bf1abf657c2028c20eebdb74cb +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8Mirlx0BM4RfqzRjAPX6UG9XjMPSTk7yCSKSAbvj6rL1yslot9dvMT1DSj3RU2APcr5hxQEqiTU=', 'x-amz-request-id': 'GAS7TETKTYY5Y4MW', 'Date': 'Fri, 11 Nov 2022 01:07:12 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180720T000000, start_date=20221111T010710, end_date=20221111T010712 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:12.974782Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "84e62f79-25d2-4f80-ae36-07b279cbbee6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b504a219 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:04.946205Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "df46940b-6c30-4ffb-9954-70ef927a9481"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:04.946205+00:00, try_number=1, job_id=901, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-20 00:00:00+00:00 +INFO - Started process 7557 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-20T00:00:00+00:00', '--job-id', '901', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx50j5di1'] +INFO - Job 901: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180720T000000, start_date=20221111T010704, end_date=20221111T010708 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:08.650229Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "df46940b-6c30-4ffb-9954-70ef927a9481"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..14d73c40 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:04.938110Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "15ba5c1d-ac0e-3943-818a-4b00424fd31e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d9c581d-a32b-483c-93cb-0f99d02cd6ae"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:04.938110+00:00, try_number=1, job_id=902, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-20 00:00:00+00:00 +INFO - Started process 7556 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-20T00:00:00+00:00', '--job-id', '902', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxp10g9uu'] +INFO - Job 902: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180720T000000, start_date=20221111T010704, end_date=20221111T010707 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:07.892656Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d9c581d-a32b-483c-93cb-0f99d02cd6ae"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..97eea7af --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:07:15.984793Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51f95e6b-c639-41d7-9682-2f8b7da65ac9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:15.984793+00:00, try_number=1, job_id=906, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-21 00:00:00+00:00 +INFO - Started process 7549 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-21T00:00:00+00:00', '--job-id', '906', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmm6bfbkv'] +INFO - Job 906: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180721T000000, start_date=20221111T010715, end_date=20221111T010719 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:19.269034Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51f95e6b-c639-41d7-9682-2f8b7da65ac9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2efc1d56 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:07:15.984902Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1e3736a3-593e-4ea8-bf36-ab7878f6e779"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:15.984902+00:00, try_number=1, job_id=905, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-21 00:00:00+00:00 +INFO - Started process 7547 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-21T00:00:00+00:00', '--job-id', '905', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfztn7uhc'] +INFO - Job 905: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180721T000000, start_date=20221111T010715, end_date=20221111T010720 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:20.056337Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1e3736a3-593e-4ea8-bf36-ab7878f6e779"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..46bc9521 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:27.093093Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ca8cd818-003e-418a-a451-6ee3c31c4e2a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:27.093093+00:00, try_number=1, job_id=910, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-21 00:00:00+00:00 +INFO - Started process 7564 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-21T00:00:00+00:00', '--job-id', '910', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpllk3usqq'] +INFO - Job 910: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eeca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'AGl41POaq4lYXPswO8OH4A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:AGl41POaq4lYXPswO8OH4A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010727Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010727Z +20221111/us-east-1/s3/aws4_request +39e53eca3d19e5601fc4d670430a0e918dc875818071f892ce4cc8f33ab5c41b +INFO - '2022-11-11' - botocore.auth - Signature: +291674323baad6d8d571876f56f9b5510a6704b5df19ce729811d83945b157af +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'CDar2XYg3uHyMvrpegwRJDAOBqz5jh8w4IMx2kLw5uhAbSTdjmgOViyU1JqQmppuob1Jz7BxXSIk0QncoUQjvQ==', 'x-amz-request-id': 'RGHJSMFEY374EF2T', 'Date': 'Fri, 11 Nov 2022 01:07:28 GMT', 'ETag': '"006978d4f39aab89585cfb303bc387e0"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180721T000000, start_date=20221111T010727, end_date=20221111T010729 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:29.168363Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ca8cd818-003e-418a-a451-6ee3c31c4e2a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9e42bdf2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:27.081433Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dbe47ecf-7800-46c4-b7c1-d751b591b67e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:27.081433+00:00, try_number=1, job_id=909, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-21 00:00:00+00:00 +INFO - Started process 7563 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-21T00:00:00+00:00', '--job-id', '909', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp80nkm6k9'] +INFO - Job 909: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eeca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010727Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010727Z +20221111/us-east-1/s3/aws4_request +811d64c35ce342d7751039e517da8a41476b6538bf50be5abf3f9bd5852ebcd6 +INFO - '2022-11-11' - botocore.auth - Signature: +5df99fa660874deb830db786d2db449e57f82aa48e396923e92200739b6de933 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BQr8avrfeB8lHAptS7eAS6IplFh/3UJWakRCul1+SJXa71Egb+NJxGgeITKrT04KcY6k3e1+m5kwn3eAYina2w==', 'x-amz-request-id': 'RGHMECJXR5J8PBJS', 'Date': 'Fri, 11 Nov 2022 01:07:28 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180721T000000, start_date=20221111T010727, end_date=20221111T010729 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:29.177484Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dbe47ecf-7800-46c4-b7c1-d751b591b67e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8308c65c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:20.856756Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1718ff2a-eb7c-4dae-a306-c075d3bd5bb1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:20.856756+00:00, try_number=1, job_id=907, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-21 00:00:00+00:00 +INFO - Started process 7635 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-21T00:00:00+00:00', '--job-id', '907', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps0mts893'] +INFO - Job 907: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180721T000000, start_date=20221111T010720, end_date=20221111T010725 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:25.183520Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1718ff2a-eb7c-4dae-a306-c075d3bd5bb1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..33f73f7b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:22.010399Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "dcc914b5-4b6a-37e0-bfc9-a8e11e06ae00"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2335ca8f-e44c-42fd-9b9d-71696b4d1151"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:22.010399+00:00, try_number=1, job_id=908, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-21 00:00:00+00:00 +INFO - Started process 7555 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-21T00:00:00+00:00', '--job-id', '908', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpscp67ytr'] +INFO - Job 908: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180721T000000, start_date=20221111T010722, end_date=20221111T010724 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:24.967402Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2335ca8f-e44c-42fd-9b9d-71696b4d1151"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b5b57264 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:07:32.199144Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1329870f-7108-4b1a-bb4b-d011c64d9da7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:32.199144+00:00, try_number=1, job_id=912, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-22 00:00:00+00:00 +INFO - Started process 7644 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-22T00:00:00+00:00', '--job-id', '912', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpb4tqbc8j'] +INFO - Job 912: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180722T000000, start_date=20221111T010732, end_date=20221111T010735 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:35.525944Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1329870f-7108-4b1a-bb4b-d011c64d9da7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..0c11bea8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:07:32.170025Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6006ea52-a7b2-45c6-9f5c-c097332e76f8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:32.170025+00:00, try_number=1, job_id=911, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-22 00:00:00+00:00 +INFO - Started process 7641 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-22T00:00:00+00:00', '--job-id', '911', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn_xrls5c'] +INFO - Job 911: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180722T000000, start_date=20221111T010732, end_date=20221111T010735 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:35.526478Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6006ea52-a7b2-45c6-9f5c-c097332e76f8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bb9bed26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:45.830547Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "addf1d7b-8ef7-44aa-8653-b5f002df90ec"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:45.830547+00:00, try_number=1, job_id=916, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-22 00:00:00+00:00 +INFO - Started process 7649 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-22T00:00:00+00:00', '--job-id', '916', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl0aev2fn'] +INFO - Job 916: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '3++jheH+Ezx4hAso53Q74Q==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:3++jheH+Ezx4hAso53Q74Q== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010746Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010746Z +20221111/us-east-1/s3/aws4_request +f4798815070c23aec741c67aa45047ef474675074396236efb1c19d5cc021578 +INFO - '2022-11-11' - botocore.auth - Signature: +61e0d4ee8c336b2803d3ec61271613d0c5ac62dab9e06d901dbcb3b478b5d17e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'XcgLXCe8s0cXYyyk6YqlIPEeEd+WMvwKO+T11zStHIk/kZc0HivYhqwiPV7tphEOxiRk0OEHoxs=', 'x-amz-request-id': 'XY8NABSSJH3R24MA', 'Date': 'Fri, 11 Nov 2022 01:07:47 GMT', 'ETag': '"dfefa385e1fe133c78840b28e7743be1"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180722T000000, start_date=20221111T010745, end_date=20221111T010747 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:47.941477Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "addf1d7b-8ef7-44aa-8653-b5f002df90ec"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..018199ef --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:43.375646Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d4e3902-9351-4808-87ba-a61625ebb02c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:43.375646+00:00, try_number=1, job_id=915, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-22 00:00:00+00:00 +INFO - Started process 7670 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-22T00:00:00+00:00', '--job-id', '915', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl8_fxscq'] +INFO - Job 915: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50041f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010744Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010744Z +20221111/us-east-1/s3/aws4_request +d5584f23690d536798c3d1fe3ec3a5dfecf60b0ff10a2bd1aa7d018d7d8993e4 +INFO - '2022-11-11' - botocore.auth - Signature: +17cbde2e47007398bc56ae4b108fe1bf1e0f12d7c90f9102311a273d60f7109d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'NjPN8HhhsALaWOU2kj6c4WmyOFscTzYw9HBq0RMhwesqoaE9PORp0vrTzl/T5qnitXfoMPPrAK0=', 'x-amz-request-id': 'C4JGX0CCBWS3JJ33', 'Date': 'Fri, 11 Nov 2022 01:07:45 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180722T000000, start_date=20221111T010743, end_date=20221111T010746 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:46.054398Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d4e3902-9351-4808-87ba-a61625ebb02c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..da1fd9d2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:37.233738Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a5b78ee3-bae3-4f35-ab94-15de7eac4e56"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:37.233738+00:00, try_number=1, job_id=913, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-22 00:00:00+00:00 +INFO - Started process 7576 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-22T00:00:00+00:00', '--job-id', '913', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuvj4wvw7'] +INFO - Job 913: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180722T000000, start_date=20221111T010737, end_date=20221111T010743 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:43.513244Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a5b78ee3-bae3-4f35-ab94-15de7eac4e56"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3f9e14ec --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:37.301374Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "19a0c017-f20b-3bc3-9c27-473480dcaa85"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d99a7e4-8d19-40d9-b757-5dcb32bac9df"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:37.301374+00:00, try_number=1, job_id=914, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-22 00:00:00+00:00 +INFO - Started process 7578 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-22T00:00:00+00:00', '--job-id', '914', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbyh6r35v'] +INFO - Job 914: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180722T000000, start_date=20221111T010737, end_date=20221111T010740 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:40.159413Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d99a7e4-8d19-40d9-b757-5dcb32bac9df"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..afff4e4f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:07:50.328968Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6df9fce-d6ff-45e1-91df-233eb41a8aae"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:50.328968+00:00, try_number=1, job_id=918, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-23 00:00:00+00:00 +INFO - Started process 7726 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-23T00:00:00+00:00', '--job-id', '918', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz7_3yypp'] +INFO - Job 918: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180723T000000, start_date=20221111T010750, end_date=20221111T010753 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:53.875332Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6df9fce-d6ff-45e1-91df-233eb41a8aae"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..69d40a36 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:07:50.293754Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c7d4b741-7b47-4ccd-b391-94d79219d535"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:50.293754+00:00, try_number=1, job_id=917, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-23 00:00:00+00:00 +INFO - Started process 7724 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-23T00:00:00+00:00', '--job-id', '917', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp75r_299_'] +INFO - Job 917: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180723T000000, start_date=20221111T010750, end_date=20221111T010753 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:53.898566Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c7d4b741-7b47-4ccd-b391-94d79219d535"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..9f3444ba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:03.040066Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a13e03d-b861-4df9-a21c-3bf55b64706c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:03.040066+00:00, try_number=1, job_id=922, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-23 00:00:00+00:00 +INFO - Started process 7749 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-23T00:00:00+00:00', '--job-id', '922', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwyoxj4vz'] +INFO - Job 922: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'lLS5C+2P/8C/YWUh0QcKzQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:lLS5C+2P/8C/YWUh0QcKzQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010803Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010803Z +20221111/us-east-1/s3/aws4_request +440fea0633ed7b24b183604a08570025c793e837dab4e2b03460650ef2f68cc5 +INFO - '2022-11-11' - botocore.auth - Signature: +8438fb8d4039167d9105bfc9b9e52b005d2c424f9eb5504797da39c8232e9509 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'rNjzDh4JW6zPiTIflL5vekISgvXeqPUQCiW3jjR9zGZ5rTWrYb3fMKIzoGytJI5lBRDnmiRqWC0=', 'x-amz-request-id': 'H3G283EGHFC2G6T9', 'Date': 'Fri, 11 Nov 2022 01:08:04 GMT', 'ETag': '"94b4b90bed8fffc0bf616521d1070acd"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180723T000000, start_date=20221111T010803, end_date=20221111T010804 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:04.962395Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a13e03d-b861-4df9-a21c-3bf55b64706c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4e6cdef1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:00.586668Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ca07c14-01f9-44a2-9b64-dbaee772709b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:00.586668+00:00, try_number=1, job_id=921, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-23 00:00:00+00:00 +INFO - Started process 7741 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-23T00:00:00+00:00', '--job-id', '921', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7vfmmo6w'] +INFO - Job 921: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50083a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010801Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010801Z +20221111/us-east-1/s3/aws4_request +a19390f1ff74f64f99e46c5e4fd271e1da45ed8f674812ed98e74f5fef243cee +INFO - '2022-11-11' - botocore.auth - Signature: +b21dc53c6f478ce58827237f1f1cacbbb7f0e22592ced1bdf3516b02cc77613b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'xhK1hBa8S+1k8LTQj6VPNulpGdcrk4FWgod1TycWQRLAOSGhgB7C8S5wIry2NHwCG9i0QibrFlc=', 'x-amz-request-id': 'PR57MSG8HWHS64SM', 'Date': 'Fri, 11 Nov 2022 01:08:02 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180723T000000, start_date=20221111T010800, end_date=20221111T010803 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:03.126406Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ca07c14-01f9-44a2-9b64-dbaee772709b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..64c90826 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:55.520680Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "78c24b7c-eeae-48b6-b45c-0ea5546b0e61"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:55.520680+00:00, try_number=1, job_id=920, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-23 00:00:00+00:00 +INFO - Started process 7736 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-23T00:00:00+00:00', '--job-id', '920', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp15te2oon'] +INFO - Job 920: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180723T000000, start_date=20221111T010755, end_date=20221111T010801 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:01.487383Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "78c24b7c-eeae-48b6-b45c-0ea5546b0e61"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..cad7f88e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:07:55.503955Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9f48878b-8324-3911-b7c5-0b373192747a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed319014-2479-4776-ad4e-59e546830901"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:07:55.503955+00:00, try_number=1, job_id=919, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-23 00:00:00+00:00 +INFO - Started process 7734 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-23T00:00:00+00:00', '--job-id', '919', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp899l0d5_'] +INFO - Job 919: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180723T000000, start_date=20221111T010755, end_date=20221111T010758 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-23T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:07:58.306470Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ed319014-2479-4776-ad4e-59e546830901"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..a631282c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:08:07.254063Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a0d3a4a-ec32-4537-bbd9-90052fef00c8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:07.254063+00:00, try_number=1, job_id=923, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-24 00:00:00+00:00 +INFO - Started process 7758 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-24T00:00:00+00:00', '--job-id', '923', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpja4i0v6y'] +INFO - Job 923: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180724T000000, start_date=20221111T010807, end_date=20221111T010810 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:10.724810Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1a0d3a4a-ec32-4537-bbd9-90052fef00c8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..65b11508 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:08:07.323133Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "187a63c3-0dac-4a46-8e7a-3d4276d461a3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:07.323133+00:00, try_number=1, job_id=924, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-24 00:00:00+00:00 +INFO - Started process 7760 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-24T00:00:00+00:00', '--job-id', '924', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3ngxa9v4'] +INFO - Job 924: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180724T000000, start_date=20221111T010807, end_date=20221111T010810 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:10.734427Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "187a63c3-0dac-4a46-8e7a-3d4276d461a3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..63e68711 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:23.295905Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "06d425b6-0c38-41e3-801c-7cb12d6a6380"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:23.295905+00:00, try_number=1, job_id=928, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-24 00:00:00+00:00 +INFO - Started process 7831 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-24T00:00:00+00:00', '--job-id', '928', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfwkyazrl'] +INFO - Job 928: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'lLS5C+2P/8C/YWUh0QcKzQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:lLS5C+2P/8C/YWUh0QcKzQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010824Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010824Z +20221111/us-east-1/s3/aws4_request +00fad497036f359ec3424a30b30df06f2a3653b6641de30ee2e20458d4945a79 +INFO - '2022-11-11' - botocore.auth - Signature: +4c1a448c361f2a3419ac4eaa8619e121bdf4a04f228b58d62628ca9d34f39dcc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'w12MgTtUowW6SIDa7UB0dRg4zyNGWvw+S4IQqJHgvXXULpSL2b08FuNbXpke/haXrbggBcHvURQ=', 'x-amz-request-id': 'VF0YY2ZWBD8DJQE1', 'Date': 'Fri, 11 Nov 2022 01:08:24 GMT', 'ETag': '"94b4b90bed8fffc0bf616521d1070acd"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180724T000000, start_date=20221111T010823, end_date=20221111T010825 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:25.471935Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "06d425b6-0c38-41e3-801c-7cb12d6a6380"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..63fcecb8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:19.412630Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "76ded1cb-32ee-42eb-bb7f-0e18979de8b6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:19.412630+00:00, try_number=1, job_id=927, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-24 00:00:00+00:00 +INFO - Started process 7730 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-24T00:00:00+00:00', '--job-id', '927', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr8qyy640'] +INFO - Job 927: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010820Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010820Z +20221111/us-east-1/s3/aws4_request +d66eb7cbb20f346e575a2f25eda239c6a98ac6f7c889197eb535e721b6ce37b8 +INFO - '2022-11-11' - botocore.auth - Signature: +ea27da18bf426b1a7ae065e31aac75289b900f363fa02d534cfa51572d3f8d10 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'AQGlGiDYDqZgI7gphCuAxY1IFNZIi96pk0nMgJswIJZBwPFCCpOpvWikE8724/2kAjKbivDtOW4=', 'x-amz-request-id': '56W617ACGN38WWHT', 'Date': 'Fri, 11 Nov 2022 01:08:21 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180724T000000, start_date=20221111T010819, end_date=20221111T010821 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:21.965598Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "76ded1cb-32ee-42eb-bb7f-0e18979de8b6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a793d84e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:12.576702Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99064f07-6262-402b-bc6e-a3a63b304d13"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:12.576702+00:00, try_number=1, job_id=925, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-24 00:00:00+00:00 +INFO - Started process 7694 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-24T00:00:00+00:00', '--job-id', '925', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvczr36_i'] +INFO - Job 925: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180724T000000, start_date=20221111T010812, end_date=20221111T010820 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:20.945921Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "99064f07-6262-402b-bc6e-a3a63b304d13"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..9c0d1915 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:12.677718Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b083b700-b733-3b21-a404-e9935dc64020"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a53cfa5b-e154-4af0-acda-3498b693df03"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:12.677718+00:00, try_number=1, job_id=926, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-24 00:00:00+00:00 +INFO - Started process 7696 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-24T00:00:00+00:00', '--job-id', '926', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz657_65o'] +INFO - Job 926: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180724T000000, start_date=20221111T010812, end_date=20221111T010815 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-24T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:15.985721Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a53cfa5b-e154-4af0-acda-3498b693df03"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9d848a5e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:08:28.142312Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd551ddf-938a-4929-94c6-937b1ea1940f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:28.142312+00:00, try_number=1, job_id=930, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-25 00:00:00+00:00 +INFO - Started process 7742 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-25T00:00:00+00:00', '--job-id', '930', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptq1o3dpm'] +INFO - Job 930: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180725T000000, start_date=20221111T010828, end_date=20221111T010831 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:31.147683Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fd551ddf-938a-4929-94c6-937b1ea1940f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..ca1d5445 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:08:28.139050Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f98666a1-41df-4346-a4e5-bd12d4d4a80f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:28.139050+00:00, try_number=1, job_id=929, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-25 00:00:00+00:00 +INFO - Started process 7740 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-25T00:00:00+00:00', '--job-id', '929', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgxtp3zvy'] +INFO - Job 929: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180725T000000, start_date=20221111T010828, end_date=20221111T010831 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:31.152052Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f98666a1-41df-4346-a4e5-bd12d4d4a80f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4cff25f1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:42.390610Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d1a246b-856a-4df2-914c-544d3749b792"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:42.390610+00:00, try_number=1, job_id=934, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-25 00:00:00+00:00 +INFO - Started process 7771 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-25T00:00:00+00:00', '--job-id', '934', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqch453px'] +INFO - Job 934: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498eff70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'oQdASIYPudU1kO3hK50Acg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:oQdASIYPudU1kO3hK50Acg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010843Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010843Z +20221111/us-east-1/s3/aws4_request +61e1ebddd494e9b8ec727f624f2cd137015ca944078c9e0f70669f65b752b1d6 +INFO - '2022-11-11' - botocore.auth - Signature: +b6a89090de1e35acb781a9c7e88f1041d6465789d5ac2d8b28f3a4d15644d63e +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'iklrP3yj3ilehvM21lC5IAo4yTZF59mh2O/MkVX0UWxAoKH4NJMOmXrwpG19FqlXZ0spoUneeu4=', 'x-amz-request-id': '1P4QSVTCDBQ6DCHQ', 'Date': 'Fri, 11 Nov 2022 01:08:43 GMT', 'ETag': '"a1074048860fb9d53590ede12b9d0072"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180725T000000, start_date=20221111T010842, end_date=20221111T010844 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:44.266437Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d1a246b-856a-4df2-914c-544d3749b792"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f51511e8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:38.104662Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5c82210-c8cd-451c-8693-e55ad61bdd28"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:38.104662+00:00, try_number=1, job_id=933, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-25 00:00:00+00:00 +INFO - Started process 7847 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-25T00:00:00+00:00', '--job-id', '933', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxb9u2ltz'] +INFO - Job 933: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50043a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010839Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010839Z +20221111/us-east-1/s3/aws4_request +6e95b5d68fb2a96f893c1012140ab6d862e203ac1328eb521c8d19013354d2c3 +INFO - '2022-11-11' - botocore.auth - Signature: +385e540f56c4e9ad8ec801042d71ed5c41b28aa7166da9e8eea6c1bb12993998 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'qmjOPZ957+LiER37SPzL8yjQqU7qU8WDanr527Gk+NwJOJCWA6Gwd1S+9FyLx0h5QixkJPVOzA4=', 'x-amz-request-id': 'J86WXCJDXAKV4SVH', 'Date': 'Fri, 11 Nov 2022 01:08:39 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180725T000000, start_date=20221111T010838, end_date=20221111T010840 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:40.189918Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5c82210-c8cd-451c-8693-e55ad61bdd28"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..4d646c2b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:32.956950Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74246d06-5414-4d7c-afad-4b160fe3034e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:32.956950+00:00, try_number=1, job_id=932, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-25 00:00:00+00:00 +INFO - Started process 7842 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-25T00:00:00+00:00', '--job-id', '932', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy3u3300f'] +INFO - Job 932: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180725T000000, start_date=20221111T010832, end_date=20221111T010840 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:40.805487Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74246d06-5414-4d7c-afad-4b160fe3034e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..da97483f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:32.913133Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "bf683584-1f21-38df-b2d7-466bddb98401"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d3ee5c7-2169-401b-9868-a459c7bc4cc3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:32.913133+00:00, try_number=1, job_id=931, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-25 00:00:00+00:00 +INFO - Started process 7840 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-25T00:00:00+00:00', '--job-id', '931', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp01jdqe_d'] +INFO - Job 931: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180725T000000, start_date=20221111T010832, end_date=20221111T010836 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-25T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:36.389247Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d3ee5c7-2169-401b-9868-a459c7bc4cc3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..40b8560b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:08:47.682849Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b171efb3-8022-40b0-9ccd-39956792d904"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:47.682849+00:00, try_number=1, job_id=936, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-26 00:00:00+00:00 +INFO - Started process 7824 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-26T00:00:00+00:00', '--job-id', '936', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpke5iaxsb'] +INFO - Job 936: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180726T000000, start_date=20221111T010847, end_date=20221111T010851 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:51.063162Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b171efb3-8022-40b0-9ccd-39956792d904"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..8b572ddf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:08:47.668027Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc796ae1-4bf6-4e9a-b6ad-eb0b9329ee39"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:47.668027+00:00, try_number=1, job_id=935, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-26 00:00:00+00:00 +INFO - Started process 7821 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-26T00:00:00+00:00', '--job-id', '935', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1iedepcc'] +INFO - Job 935: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180726T000000, start_date=20221111T010847, end_date=20221111T010851 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:51.061696Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc796ae1-4bf6-4e9a-b6ad-eb0b9329ee39"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..8c699305 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:01.837601Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c31b770e-dc88-426a-8c5e-7563a091a61c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:01.837601+00:00, try_number=1, job_id=940, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-26 00:00:00+00:00 +INFO - Started process 7927 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-26T00:00:00+00:00', '--job-id', '940', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv5b_e_h4'] +INFO - Job 940: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'pUCEOiMKJNt8lTYqoMkrIA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:pUCEOiMKJNt8lTYqoMkrIA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010902Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010902Z +20221111/us-east-1/s3/aws4_request +db4acc13abe1656ca85e7d70b0b052742caae464bc64525b49c47a2712656b8d +INFO - '2022-11-11' - botocore.auth - Signature: +4124ef62ebb579d1671cc146eb7ad03e9c5798c1594f7ee27ae4cc901625328f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '6Jch0uxQHLvr32hteGy3hogBGmuwMhhUdVqD0t5cyY9wOAkGMsTJRgdO15gonZiB7w+1Yf056j0=', 'x-amz-request-id': 'ZEQ34XDD05MHZXTE', 'Date': 'Fri, 11 Nov 2022 01:09:03 GMT', 'ETag': '"a540843a230a24db7c95362aa0c92b20"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180726T000000, start_date=20221111T010901, end_date=20221111T010904 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:04.025758Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c31b770e-dc88-426a-8c5e-7563a091a61c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1fd5ceab --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:58.447876Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93463f50-cb14-4bc7-a3d5-65bb7c9919a2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:58.447876+00:00, try_number=1, job_id=939, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-26 00:00:00+00:00 +INFO - Started process 7920 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-26T00:00:00+00:00', '--job-id', '939', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp94tkj_69'] +INFO - Job 939: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50063a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010859Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010859Z +20221111/us-east-1/s3/aws4_request +3146319ac8f9d8a1df6ebeed73bfc51ab3943f296d144be17881aaa03122d6ba +INFO - '2022-11-11' - botocore.auth - Signature: +f9492af7455fab9ff5a14f621646c3c0a0c4bc0f6f60c2dae2d84704a04fca66 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Jv0sfx9MAmgR0uukEdBUA0p4qJlKmvEn3iE+DnOoY0PTxCne7SR5OHCOQm7eqNb0gHeNfE5W1A8=', 'x-amz-request-id': 'QVEGR5CXERZSKEVT', 'Date': 'Fri, 11 Nov 2022 01:09:00 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180726T000000, start_date=20221111T010858, end_date=20221111T010901 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:01.088315Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93463f50-cb14-4bc7-a3d5-65bb7c9919a2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..11fc9559 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:53.517828Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b82e95f-1ab8-4dce-8853-474a2523921b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:53.517828+00:00, try_number=1, job_id=938, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-26 00:00:00+00:00 +INFO - Started process 7834 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-26T00:00:00+00:00', '--job-id', '938', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbfftq0yy'] +INFO - Job 938: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180726T000000, start_date=20221111T010853, end_date=20221111T010859 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:59.559348Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b82e95f-1ab8-4dce-8853-474a2523921b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..0111f67a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:08:53.515219Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "6061ef3a-ca04-3aa7-b2f7-fb2c65794ec5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c352a4c7-0ded-43e6-a47b-dd86b0fe07d6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:08:53.515219+00:00, try_number=1, job_id=937, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-26 00:00:00+00:00 +INFO - Started process 7832 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-26T00:00:00+00:00', '--job-id', '937', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfzpc5m0v'] +INFO - Job 937: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180726T000000, start_date=20221111T010853, end_date=20221111T010856 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-26T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:08:56.917580Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c352a4c7-0ded-43e6-a47b-dd86b0fe07d6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..0d7ecfcf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:09:06.305548Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8f687220-346c-46c9-b3c4-5c0abb0b52cc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:06.305548+00:00, try_number=1, job_id=941, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-27 00:00:00+00:00 +INFO - Started process 7935 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-27T00:00:00+00:00', '--job-id', '941', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq7vyj6z9'] +INFO - Job 941: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180727T000000, start_date=20221111T010906, end_date=20221111T010909 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:09.759997Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8f687220-346c-46c9-b3c4-5c0abb0b52cc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d939544c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:09:06.560855Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "355e4935-b53c-4f13-be1e-dd2827694e60"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:06.560855+00:00, try_number=1, job_id=942, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-27 00:00:00+00:00 +INFO - Started process 7938 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-27T00:00:00+00:00', '--job-id', '942', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuhi3hf0h'] +INFO - Job 942: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180727T000000, start_date=20221111T010906, end_date=20221111T010909 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:09.768946Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "355e4935-b53c-4f13-be1e-dd2827694e60"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f093d343 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:23.065544Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b3a808d-6d14-40f1-bd55-4c67f6505c78"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:23.065544+00:00, try_number=1, job_id=946, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-27 00:00:00+00:00 +INFO - Started process 8026 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-27T00:00:00+00:00', '--job-id', '946', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkfm8fuua'] +INFO - Job 946: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'tnFhDAEKpyn2G6PeeLVEVQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:tnFhDAEKpyn2G6PeeLVEVQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010923Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010923Z +20221111/us-east-1/s3/aws4_request +8c0f69a56012d0a75c6c93db66dc84f549352c823c25a7174192033ab826ee4e +INFO - '2022-11-11' - botocore.auth - Signature: +42bd25909895cec771bfcbcef3df940f658ad10201cd53361a105f9b32c34546 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8iGZq/A4EkvBPXGnFAm8ud7cvf3aUv8oUgiJjOwL5GJmW3zT3FmB5YqxHk+2c432Re63mXSwl84=', 'x-amz-request-id': 'ERX8CHB9C1QHFEY2', 'Date': 'Fri, 11 Nov 2022 01:09:24 GMT', 'ETag': '"b671610c010aa729f61ba3de78b54455"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180727T000000, start_date=20221111T010923, end_date=20221111T010924 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:24.868783Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b3a808d-6d14-40f1-bd55-4c67f6505c78"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..25bfce57 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:18.760776Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "94ed27ea-9b0a-4cd0-a160-0b98ef2e74d7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:18.760776+00:00, try_number=1, job_id=945, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-27 00:00:00+00:00 +INFO - Started process 7994 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-27T00:00:00+00:00', '--job-id', '945', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjr8sz9sl'] +INFO - Job 945: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50093a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010920Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010920Z +20221111/us-east-1/s3/aws4_request +9e5bd7c9f1f1874d0e4b416b50a175d9635d464e5592beda4068610b1de02aef +INFO - '2022-11-11' - botocore.auth - Signature: +8b40dfb99e5a193d774df05e624c0e64c3c744c304cfc79e4476f9704fe9a732 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'iJNlkPdwf2DFD28GGR8P4nxailFoeBkHDEp/aj8NvvO7SaZYb7A077WNU0V58HvfLkMkK2grbCk=', 'x-amz-request-id': 'GDC0Z90SYBDXNFZQ', 'Date': 'Fri, 11 Nov 2022 01:09:21 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180727T000000, start_date=20221111T010918, end_date=20221111T010922 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:22.277261Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "94ed27ea-9b0a-4cd0-a160-0b98ef2e74d7"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..fdec67c8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:12.067457Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b59cec6d-3d47-4544-b190-c0f914d3abec"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:12.067457+00:00, try_number=1, job_id=944, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-27 00:00:00+00:00 +INFO - Started process 7948 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-27T00:00:00+00:00', '--job-id', '944', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpl1r15vo7'] +INFO - Job 944: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180727T000000, start_date=20221111T010912, end_date=20221111T010920 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:20.919271Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b59cec6d-3d47-4544-b190-c0f914d3abec"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..780003c7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:12.067243Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ea807fe5-2dc9-3fc6-a005-865dc1dd5da6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f8be9478-f279-4a74-8188-84bdf6369225"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:12.067243+00:00, try_number=1, job_id=943, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-27 00:00:00+00:00 +INFO - Started process 7947 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-27T00:00:00+00:00', '--job-id', '943', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprno5k811'] +INFO - Job 943: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180727T000000, start_date=20221111T010912, end_date=20221111T010915 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-27T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:15.141647Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f8be9478-f279-4a74-8188-84bdf6369225"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..853e6821 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:09:27.704703Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "20c28772-e1d8-411f-8663-67a70c30460d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:27.704703+00:00, try_number=1, job_id=948, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-28 00:00:00+00:00 +INFO - Started process 7909 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-28T00:00:00+00:00', '--job-id', '948', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_3ua9c_v'] +INFO - Job 948: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180728T000000, start_date=20221111T010927, end_date=20221111T010931 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:31.088232Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "20c28772-e1d8-411f-8663-67a70c30460d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..716bebdb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:09:27.646369Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b971b43-0ba3-451e-9687-c022b524ceef"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:27.646369+00:00, try_number=1, job_id=947, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-28 00:00:00+00:00 +INFO - Started process 7906 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-28T00:00:00+00:00', '--job-id', '947', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy5voony6'] +INFO - Job 947: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180728T000000, start_date=20221111T010927, end_date=20221111T010931 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:31.035372Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b971b43-0ba3-451e-9687-c022b524ceef"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..226a484b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:42.085753Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9f114af-0b83-43e4-9b31-93d1ce527b67"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:42.085753+00:00, try_number=1, job_id=952, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-28 00:00:00+00:00 +INFO - Started process 7928 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-28T00:00:00+00:00', '--job-id', '952', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxsgy0a5g'] +INFO - Job 952: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '0XR6L7GzLwWSXsQUrd6aBg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:0XR6L7GzLwWSXsQUrd6aBg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010942Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010942Z +20221111/us-east-1/s3/aws4_request +8ee412afb3633a4deac7762ed46fdb38ee6395e640918c73421a90542c2774c1 +INFO - '2022-11-11' - botocore.auth - Signature: +4c557b629da6b39e263bec8120f2e2254dfa23a0c064dc1129f5f372c6f0a9f0 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'GMT7jw2IONcMi8xqIl3yvpXcW1aGlKDXJWWiBJDbdUH9Fjq7iwIvP9XK8sWmfvFtn7rVv5CH8XY=', 'x-amz-request-id': 'T36KSQN6ASWABCNF', 'Date': 'Fri, 11 Nov 2022 01:09:43 GMT', 'ETag': '"d1747a2fb1b32f05925ec414adde9a06"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180728T000000, start_date=20221111T010942, end_date=20221111T010943 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:43.956479Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f9f114af-0b83-43e4-9b31-93d1ce527b67"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..704cef15 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:39.119455Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57c3eaf5-0814-4963-a3dd-f0a019e74373"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:39.119455+00:00, try_number=1, job_id=951, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-28 00:00:00+00:00 +INFO - Started process 7915 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-28T00:00:00+00:00', '--job-id', '951', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmppjx19mw_'] +INFO - Job 951: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T010939Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T010939Z +20221111/us-east-1/s3/aws4_request +70b48b6be13951e4320e2ea492f4fe72c90e22480750d26c5a46a98a948697dc +INFO - '2022-11-11' - botocore.auth - Signature: +ee24897b41f907b0b0913bd9e4202df9d1f92667f5228ed3a32f7a7d5d24f519 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'CBUVRI+w9UtPT+KvsklCgiG9OgjbMjNE0wIGNLT8JLeOmrQpTEVmE+KSHk8lQU03tS4wFM3E/po=', 'x-amz-request-id': 'CGG4583RW35E5KV5', 'Date': 'Fri, 11 Nov 2022 01:09:40 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180728T000000, start_date=20221111T010939, end_date=20221111T010941 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:41.270665Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "57c3eaf5-0814-4963-a3dd-f0a019e74373"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..9ae01b9b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:33.308003Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cdd2152f-94be-4493-aa95-9a8e24debb65"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:33.308003+00:00, try_number=1, job_id=950, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-28 00:00:00+00:00 +INFO - Started process 8037 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-28T00:00:00+00:00', '--job-id', '950', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa37qfodp'] +INFO - Job 950: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180728T000000, start_date=20221111T010933, end_date=20221111T010940 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:40.305230Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cdd2152f-94be-4493-aa95-9a8e24debb65"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..07466f99 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:33.269333Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "fde2cf62-0a7a-3470-bb72-e430281bc19d"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "04fbe47d-cccd-4213-ba0e-182df9a6375c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:33.269333+00:00, try_number=1, job_id=949, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-28 00:00:00+00:00 +INFO - Started process 8035 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-28T00:00:00+00:00', '--job-id', '949', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuv9_stmd'] +INFO - Job 949: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180728T000000, start_date=20221111T010933, end_date=20221111T010936 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-28T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:36.778386Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "04fbe47d-cccd-4213-ba0e-182df9a6375c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..a83ca657 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:09:46.752567Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e60229e7-c549-47bf-a3c4-cb1542a41c5a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:46.752567+00:00, try_number=1, job_id=954, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-29 00:00:00+00:00 +INFO - Started process 7976 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-29T00:00:00+00:00', '--job-id', '954', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo4cannhg'] +INFO - Job 954: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180729T000000, start_date=20221111T010946, end_date=20221111T010950 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:50.844056Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e60229e7-c549-47bf-a3c4-cb1542a41c5a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..8b98ab0c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:09:46.740698Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "364b39eb-a77e-466a-9706-c559a07c6ea7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:46.740698+00:00, try_number=1, job_id=953, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-29 00:00:00+00:00 +INFO - Started process 7968 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-29T00:00:00+00:00', '--job-id', '953', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpaed61dut'] +INFO - Job 953: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180729T000000, start_date=20221111T010946, end_date=20221111T010950 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:50.832253Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "364b39eb-a77e-466a-9706-c559a07c6ea7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..18723289 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:05.234053Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e33e4599-235d-4936-a6c9-403fc135ca81"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:05.234053+00:00, try_number=1, job_id=958, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-29 00:00:00+00:00 +INFO - Started process 8115 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-29T00:00:00+00:00', '--job-id', '958', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpggdq7154'] +INFO - Job 958: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'vbtSnSUVAKhAKM0HM3x8nA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:vbtSnSUVAKhAKM0HM3x8nA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011006Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011006Z +20221111/us-east-1/s3/aws4_request +2f02cdd6150d276e9eae2515cd47519ac1a1a1de49b9d42533e8b1158176f5b9 +INFO - '2022-11-11' - botocore.auth - Signature: +508930e7fe9cd51294f5c704b74730a0c6f77ec9c4a4610d7b56aa7fa476857b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Ndp1YI8b5Y7fNgUX9egVrvns/Xzn8OfR/cOXUiKb+nbz5eA3NgWwdmwzyRAk5Co72/B62E1MSoh8WLdfHyRSug==', 'x-amz-request-id': '0YZRWNF0AXRM9XS7', 'Date': 'Fri, 11 Nov 2022 01:10:07 GMT', 'ETag': '"bdbb529d251500a84028cd07337c7c9c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180729T000000, start_date=20221111T011005, end_date=20221111T011007 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:07.945139Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e33e4599-235d-4936-a6c9-403fc135ca81"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..2475b291 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:01.769840Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a4c13757-e24a-4fdd-9ab5-6b35b6b0c4c8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:01.769840+00:00, try_number=1, job_id=957, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-29 00:00:00+00:00 +INFO - Started process 8108 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-29T00:00:00+00:00', '--job-id', '957', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0t3sfhu3'] +INFO - Job 957: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011002Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011002Z +20221111/us-east-1/s3/aws4_request +5cbb659658be03d41cd2be1c762a1b0f0f4b63b2bff1f2b9259656a1157f97fc +INFO - '2022-11-11' - botocore.auth - Signature: +13ab7aed269c73496bac7adffa8d0b476a778806922198df102ae92bf4acb682 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '4gvPpekeIqRP5S7yy+NkAkFTjZ12dkvuL8w1ICiyvstthkb0VYjNTu8F6crzhvjH9k24Xgb70CI=', 'x-amz-request-id': 'YXCBWZV7E6H51TZC', 'Date': 'Fri, 11 Nov 2022 01:10:03 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180729T000000, start_date=20221111T011001, end_date=20221111T011004 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:04.475870Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a4c13757-e24a-4fdd-9ab5-6b35b6b0c4c8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..5d748e7d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:54.009567Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6fc5bfbf-18a2-4fe2-b70f-c7fed01e95b5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:54.009567+00:00, try_number=1, job_id=956, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-29 00:00:00+00:00 +INFO - Started process 8008 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-29T00:00:00+00:00', '--job-id', '956', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp30r6_pdz'] +INFO - Job 956: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180729T000000, start_date=20221111T010954, end_date=20221111T011002 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:02.981131Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6fc5bfbf-18a2-4fe2-b70f-c7fed01e95b5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..1c4dcd33 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-29T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:09:53.970038Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-29T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ab92932b-0032-31e5-b23d-e338b323cdbe"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "be897bd4-4aaf-42dd-81df-7509446c28a0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-29T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:09:53.970038+00:00, try_number=1, job_id=955, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-29 00:00:00+00:00 +INFO - Started process 8005 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-29T00:00:00+00:00', '--job-id', '955', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5v0yl957'] +INFO - Job 955: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-29T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180729T000000, start_date=20221111T010953, end_date=20221111T010958 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-29T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:09:58.334891Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "be897bd4-4aaf-42dd-81df-7509446c28a0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..15b0532a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:10:12.470126Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9143d463-b216-44a5-958b-655fa882bb48"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:12.470126+00:00, try_number=1, job_id=960, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-30 00:00:00+00:00 +INFO - Started process 8126 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-30T00:00:00+00:00', '--job-id', '960', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprvmwk1q8'] +INFO - Job 960: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180730T000000, start_date=20221111T011012, end_date=20221111T011016 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:16.689188Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9143d463-b216-44a5-958b-655fa882bb48"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..ff0c603f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:10:11.905601Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "75aef1a8-f5e9-4d44-89e7-7c7a2fc92ea4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:11.905601+00:00, try_number=1, job_id=959, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-30 00:00:00+00:00 +INFO - Started process 8123 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-30T00:00:00+00:00', '--job-id', '959', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjnslju9t'] +INFO - Job 959: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180730T000000, start_date=20221111T011011, end_date=20221111T011015 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:15.958530Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "75aef1a8-f5e9-4d44-89e7-7c7a2fc92ea4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..57f58914 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:30.993353Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "695d1598-810c-4f3c-8145-3ccee2603c1b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:30.993353+00:00, try_number=1, job_id=964, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-30 00:00:00+00:00 +INFO - Started process 8095 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-30T00:00:00+00:00', '--job-id', '964', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpioiqhpmr'] +INFO - Job 964: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '7DxfxIdThPRmbqzR7y+wSQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:7DxfxIdThPRmbqzR7y+wSQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011032Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011032Z +20221111/us-east-1/s3/aws4_request +d4ac699432acfb59a7d93b08760e20bf641f017978f84ec83eec03bab007f04c +INFO - '2022-11-11' - botocore.auth - Signature: +e7dd3d8ee2b50ce40537c5312e67be7a0b10e2043f18e9556385508a8c90388d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'EuiF3fu50jX8ga9JN5Ud+rUqJquAhbNDdMuuMVh43NZvjBmlMqb//gVklNuRW3oRRrvlUrdOhQM=', 'x-amz-request-id': 'KFZ8TTKR4AZ7WWEB', 'Date': 'Fri, 11 Nov 2022 01:10:32 GMT', 'ETag': '"ec3c5fc4875384f4666eacd1ef2fb049"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180730T000000, start_date=20221111T011030, end_date=20221111T011033 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:33.421521Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "695d1598-810c-4f3c-8145-3ccee2603c1b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..bbbb93be --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:28.974858Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58eaef79-2f13-4e7b-a765-ebc89d31d6a2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:28.974858+00:00, try_number=1, job_id=963, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-30 00:00:00+00:00 +INFO - Started process 8090 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-30T00:00:00+00:00', '--job-id', '963', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfzgpwz97'] +INFO - Job 963: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011030Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011030Z +20221111/us-east-1/s3/aws4_request +2df40d6f666c22689f5b8ed32dbff27626e550566d50c5a98d87647981857321 +INFO - '2022-11-11' - botocore.auth - Signature: +b8499822701b6b5dbc18b7a221e04e8d23d2cf9c5f9773e950df42044cbe1686 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '9K5UAE4p8vE7M9VU7KwM0CqO6D0jmkt+5k9p+S319QFj44eCiZSqj7oyM2uKCaDjeJ/34dw4+60=', 'x-amz-request-id': 'DAYJTE6X32RXWD7Z', 'Date': 'Fri, 11 Nov 2022 01:10:31 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180730T000000, start_date=20221111T011028, end_date=20221111T011032 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:32.194695Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58eaef79-2f13-4e7b-a765-ebc89d31d6a2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..095e3f47 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:20.143088Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "105e8692-9638-42db-bfbd-b04d2197a135"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:20.143088+00:00, try_number=1, job_id=962, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-30 00:00:00+00:00 +INFO - Started process 8073 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-30T00:00:00+00:00', '--job-id', '962', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9opmhrrt'] +INFO - Job 962: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180730T000000, start_date=20221111T011020, end_date=20221111T011028 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:28.987554Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "105e8692-9638-42db-bfbd-b04d2197a135"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..dc8d4c22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-30T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:19.070594Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-30T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "e7ea7a67-eddb-35c4-b008-9967fa1e6660"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f00402a1-d292-4986-9697-1eb3a7b23f4e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-30T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:19.070594+00:00, try_number=1, job_id=961, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-30 00:00:00+00:00 +INFO - Started process 8065 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-30T00:00:00+00:00', '--job-id', '961', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpd2u1v74t'] +INFO - Job 961: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-30T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180730T000000, start_date=20221111T011019, end_date=20221111T011026 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-30T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:26.269200Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f00402a1-d292-4986-9697-1eb3a7b23f4e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..8eef2025 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:10:36.380671Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1458cbfa-2890-4a5d-83ca-8127e3b2feed"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-07-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:36.380671+00:00, try_number=1, job_id=965, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-31 00:00:00+00:00 +INFO - Started process 8105 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-07-31T00:00:00+00:00', '--job-id', '965', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4mxil87n'] +INFO - Job 965: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180731T000000, start_date=20221111T011036, end_date=20221111T011040 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:40.358526Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1458cbfa-2890-4a5d-83ca-8127e3b2feed"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..f133305c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:10:36.699396Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4a50919c-366d-46ad-8c9f-ba50089e92b4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-07-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:36.699396+00:00, try_number=1, job_id=966, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-31 00:00:00+00:00 +INFO - Started process 8107 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-07-31T00:00:00+00:00', '--job-id', '966', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdue4e8sc'] +INFO - Job 966: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180731T000000, start_date=20221111T011036, end_date=20221111T011040 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:40.433031Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4a50919c-366d-46ad-8c9f-ba50089e92b4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5d5f0472 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:52.371225Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41d0dd81-e2bd-45ee-a15b-2970459389f6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-07-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:52.371225+00:00, try_number=1, job_id=970, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-31 00:00:00+00:00 +INFO - Started process 8142 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-07-31T00:00:00+00:00', '--job-id', '970', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqbtdczh7'] +INFO - Job 970: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'nCuQgXtYHt2tMAqFA3cGLA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:nCuQgXtYHt2tMAqFA3cGLA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011053Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011053Z +20221111/us-east-1/s3/aws4_request +23c93ba986b6f3e9ae8053196525f4f87257f02785fe6a14671b94b7f12aa21e +INFO - '2022-11-11' - botocore.auth - Signature: +e7c8f7ce2685e89bc738a891a3925efa44cfde99aba9268a5a9928eaaf66be78 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'nbZ7vlK4+Pl74jmMEssFSXU3P64wXs4yBtOj934a2u8a59Vp4j+s/siwf/7CjBPegfifMPNbnmQ=', 'x-amz-request-id': 'JJSFS4MXKW3JYFJ2', 'Date': 'Fri, 11 Nov 2022 01:10:53 GMT', 'ETag': '"9c2b90817b581eddad300a850377062c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180731T000000, start_date=20221111T011052, end_date=20221111T011054 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:54.555623Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41d0dd81-e2bd-45ee-a15b-2970459389f6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..6cd5ca41 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:50.132948Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9eb35bcb-5b2c-4c2d-ac28-297e42a09d08"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-07-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:50.132948+00:00, try_number=1, job_id=969, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-31 00:00:00+00:00 +INFO - Started process 8168 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-07-31T00:00:00+00:00', '--job-id', '969', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuvip67_b'] +INFO - Job 969: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499553a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011051Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011051Z +20221111/us-east-1/s3/aws4_request +99fc49a9cf3293e4811184fc3341c927fda3e84cca0dbbca0480b8c17fa608e1 +INFO - '2022-11-11' - botocore.auth - Signature: +49fb7ddffe79f57441b3b947982df9e41668432683f73fdac3f083faea75a539 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'YUG2vDl3ZNr6be13JXw3ro7O2MzRUYQ2QflrbYpsBp5xKGANnmqmyzHYY6wCUWyqSPwJnjL9aZE=', 'x-amz-request-id': 'B2KVEVHTV6NGNZE9', 'Date': 'Fri, 11 Nov 2022 01:10:51 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180731T000000, start_date=20221111T011050, end_date=20221111T011052 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:52.693656Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9eb35bcb-5b2c-4c2d-ac28-297e42a09d08"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a0a275b8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:42.656145Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b65aea3c-4a22-4b98-8684-d2ac85690bbf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-07-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:42.656145+00:00, try_number=1, job_id=967, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-31 00:00:00+00:00 +INFO - Started process 8132 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-07-31T00:00:00+00:00', '--job-id', '967', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy7ox2nf_'] +INFO - Job 967: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180731T000000, start_date=20221111T011042, end_date=20221111T011050 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:50.310307Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b65aea3c-4a22-4b98-8684-d2ac85690bbf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f6ac836c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-07-31T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:10:43.497751Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-07-31T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0b84a761-4c2f-3b5a-8836-b164c3dc168a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f473494-6617-4c91-abd1-af671ca84bff"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-07-31T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:43.497751+00:00, try_number=1, job_id=968, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-07-31 00:00:00+00:00 +INFO - Started process 8113 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-07-31T00:00:00+00:00', '--job-id', '968', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt086zocr'] +INFO - Job 968: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-07-31T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180731T000000, start_date=20221111T011043, end_date=20221111T011047 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-07-31T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:10:47.055967Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3f473494-6617-4c91-abd1-af671ca84bff"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ea660d13 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:10:57.066448Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6458fc9-9791-4dbd-9cd3-922600a75f00"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:57.066448+00:00, try_number=1, job_id=971, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-01 00:00:00+00:00 +INFO - Started process 8191 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-01T00:00:00+00:00', '--job-id', '971', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfq50zys_'] +INFO - Job 971: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180801T000000, start_date=20221111T011057, end_date=20221111T011101 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:01.873367Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6458fc9-9791-4dbd-9cd3-922600a75f00"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..d0378532 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:10:58.166941Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fcab1ad5-34b1-482f-a309-df745cb2850d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:10:58.166941+00:00, try_number=1, job_id=972, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-01 00:00:00+00:00 +INFO - Started process 8194 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-01T00:00:00+00:00', '--job-id', '972', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp69pok0ib'] +INFO - Job 972: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180801T000000, start_date=20221111T011058, end_date=20221111T011102 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:02.256477Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fcab1ad5-34b1-482f-a309-df745cb2850d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..42367c56 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:20.822336Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f41723aa-fcc0-4fe3-91b1-80ad02832127"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:20.822336+00:00, try_number=1, job_id=976, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-01 00:00:00+00:00 +INFO - Started process 8217 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-01T00:00:00+00:00', '--job-id', '976', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz_w2ujde'] +INFO - Job 976: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5/Cvu3t6lOFzkyYXOSzgZg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:5/Cvu3t6lOFzkyYXOSzgZg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011122Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011122Z +20221111/us-east-1/s3/aws4_request +9ad4068699b2b133203b5a754b6b46315e15dd5fb848c6c942be46f06b05d64c +INFO - '2022-11-11' - botocore.auth - Signature: +c88ed94654e054e8c3e505dffe05e9da313ef109397166cf2762d2e522d83e1d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '8Gj9aW25KbgtYcBKf4fdnY06TQ/di8VIYGrjVskXffeijp8Vh+7ccGwbhYAqTT8SAfp8lLoo6QY=', 'x-amz-request-id': '7E2WTRT03P0550AD', 'Date': 'Fri, 11 Nov 2022 01:11:22 GMT', 'ETag': '"e7f0afbb7b7a94e173932617392ce066"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180801T000000, start_date=20221111T011120, end_date=20221111T011123 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:23.699735Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f41723aa-fcc0-4fe3-91b1-80ad02832127"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..b333ef30 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:15.825806Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "311102b4-a403-4a70-9953-d643be1c22d3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:15.825806+00:00, try_number=1, job_id=975, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-01 00:00:00+00:00 +INFO - Started process 8209 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-01T00:00:00+00:00', '--job-id', '975', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmb9rqdgf'] +INFO - Job 975: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011117Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011117Z +20221111/us-east-1/s3/aws4_request +01179fbdeb54f4b26adca3b03c1cee991ef91cd96309741d6d64251bfef50557 +INFO - '2022-11-11' - botocore.auth - Signature: +edb6c1f2d81c5af1d3f24951bb961a8d826a549c7f4dd7b21bd842a156d8b013 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Q+AERGTYGRT0tseJaNfahmWht+52z4OB3bL/jbsrV3QZ1VoI3LovnLolNMN8tMHNR23M4WuZ2P8=', 'x-amz-request-id': 'JEN1T60401VMK3TZ', 'Date': 'Fri, 11 Nov 2022 01:11:18 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180801T000000, start_date=20221111T011115, end_date=20221111T011118 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:18.974815Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "311102b4-a403-4a70-9953-d643be1c22d3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..601dfcaa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:07.149257Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2361b589-8c09-4478-b952-428624edf3aa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:07.149257+00:00, try_number=1, job_id=974, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-01 00:00:00+00:00 +INFO - Started process 8204 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-01T00:00:00+00:00', '--job-id', '974', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpseeyqhka'] +INFO - Job 974: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180801T000000, start_date=20221111T011107, end_date=20221111T011118 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:18.289413Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2361b589-8c09-4478-b952-428624edf3aa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..91a39e19 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-01T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:06.257591Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-01T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8328627a-7b1d-3b5d-95eb-ca0a70701251"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f261c06b-219b-4db7-96b3-87b5fd9afde4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-01T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:06.257591+00:00, try_number=1, job_id=973, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-01 00:00:00+00:00 +INFO - Started process 8201 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-01T00:00:00+00:00', '--job-id', '973', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpim_87d9i'] +INFO - Job 973: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-01T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180801T000000, start_date=20221111T011106, end_date=20221111T011111 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-01T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:11.206839Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f261c06b-219b-4db7-96b3-87b5fd9afde4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d8960378 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:11:29.585674Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25338c92-6cec-4d27-8ba3-f6879e973f6d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:29.585674+00:00, try_number=1, job_id=978, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-02 00:00:00+00:00 +INFO - Started process 8228 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-02T00:00:00+00:00', '--job-id', '978', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1wa4lmwe'] +INFO - Job 978: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180802T000000, start_date=20221111T011129, end_date=20221111T011133 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:33.269824Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25338c92-6cec-4d27-8ba3-f6879e973f6d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..9f4f5dc7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:11:27.434684Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "835602db-f5b2-4b05-989e-5c5f498f33bd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:27.434684+00:00, try_number=1, job_id=977, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-02 00:00:00+00:00 +INFO - Started process 8225 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-02T00:00:00+00:00', '--job-id', '977', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphlwtofve'] +INFO - Job 977: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180802T000000, start_date=20221111T011127, end_date=20221111T011132 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:32.121044Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "835602db-f5b2-4b05-989e-5c5f498f33bd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bc1a8a53 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:56.991985Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "82b4ff63-fc07-47aa-b543-3ae19e8ed7d0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:56.991985+00:00, try_number=1, job_id=982, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-02 00:00:00+00:00 +INFO - Started process 8251 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-02T00:00:00+00:00', '--job-id', '982', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1hlm7y6r'] +INFO - Job 982: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f2f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5/Cvu3t6lOFzkyYXOSzgZg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:5/Cvu3t6lOFzkyYXOSzgZg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011158Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011158Z +20221111/us-east-1/s3/aws4_request +6e0699cebf9fab56761100a72269f353e2eb0b2c641dc463592ff154b334c1da +INFO - '2022-11-11' - botocore.auth - Signature: +a85316e31bada3ec758426cc933eda796f49e024bdd5db65220cf757acf3838f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'flKU09uHaU1TtTFit1a4JpwVB3vJCkP44LG03nuqcECOCaT4vcE4SFrCQ0m9o/cvb5pUZIR9JrU=', 'x-amz-request-id': '68FNC0NE388RMTE4', 'Date': 'Fri, 11 Nov 2022 01:11:59 GMT', 'ETag': '"e7f0afbb7b7a94e173932617392ce066"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180802T000000, start_date=20221111T011156, end_date=20221111T011200 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:00.132586Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "82b4ff63-fc07-47aa-b543-3ae19e8ed7d0"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9fd8bc84 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:42.719744Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d400bd6-e03c-4215-a45b-5870d0f436dc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:42.719744+00:00, try_number=1, job_id=981, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-02 00:00:00+00:00 +INFO - Started process 8239 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-02T00:00:00+00:00', '--job-id', '981', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp36s3z_n7'] +INFO - Job 981: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249956550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011144Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011144Z +20221111/us-east-1/s3/aws4_request +eefb64e0a8337872b576892282edec30d8ab3373ecfdb80ba5b9651897e5d5d9 +INFO - '2022-11-11' - botocore.auth - Signature: +16706387641110ec72998db496a59b489c7bc9d535e4830b7d49ff08ebdf3e15 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'hMsJCwFGjyNBzTWps5gQMpwa93YODPKqTuoE9pyPQpDH5mw0imkHeAf/dpiveCltkG6o7aI+qGI=', 'x-amz-request-id': 'KY928DYKRCDJM3NW', 'Date': 'Fri, 11 Nov 2022 01:11:44 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180802T000000, start_date=20221111T011142, end_date=20221111T011145 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:45.318453Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d400bd6-e03c-4215-a45b-5870d0f436dc"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..fc4c879b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:38.328573Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b329fabe-3531-4ac0-9642-f6d19abb359f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:38.328573+00:00, try_number=1, job_id=980, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-02 00:00:00+00:00 +INFO - Started process 8149 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-02T00:00:00+00:00', '--job-id', '980', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpc4tlhzz_'] +INFO - Job 980: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180802T000000, start_date=20221111T011138, end_date=20221111T011155 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:55.254175Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b329fabe-3531-4ac0-9642-f6d19abb359f"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..483251bd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-02T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:11:35.498800Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-02T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "39d35b78-6e3c-31b8-bf3d-bdf0f1da9038"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f283ad67-28da-4f75-bd3d-ed2abee03b6a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-02T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:11:35.498800+00:00, try_number=1, job_id=979, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-02 00:00:00+00:00 +INFO - Started process 8234 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-02T00:00:00+00:00', '--job-id', '979', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5ionb351'] +INFO - Job 979: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-02T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180802T000000, start_date=20221111T011135, end_date=20221111T011139 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-02T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:11:39.196999Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f283ad67-28da-4f75-bd3d-ed2abee03b6a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ee581f26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:12:05.024003Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d4ed4b5-2b36-44ae-9b9a-078d24209353"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:05.024003+00:00, try_number=1, job_id=984, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-03 00:00:00+00:00 +INFO - Started process 8262 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-03T00:00:00+00:00', '--job-id', '984', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgktgbxnt'] +INFO - Job 984: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180803T000000, start_date=20221111T011205, end_date=20221111T011208 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:08.363553Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d4ed4b5-2b36-44ae-9b9a-078d24209353"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..48912e91 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:12:04.848264Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5fc83155-d528-47fd-bcd2-e1223c567311"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:04.848264+00:00, try_number=1, job_id=983, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-03 00:00:00+00:00 +INFO - Started process 8259 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-03T00:00:00+00:00', '--job-id', '983', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxnny3k9r'] +INFO - Job 983: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180803T000000, start_date=20221111T011204, end_date=20221111T011207 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:07.963600Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5fc83155-d528-47fd-bcd2-e1223c567311"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..4e50d036 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:26.604920Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17283421-771d-49d1-a033-73b1c178e768"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:26.604920+00:00, try_number=1, job_id=988, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-03 00:00:00+00:00 +INFO - Started process 8285 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-03T00:00:00+00:00', '--job-id', '988', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm2dqk0ev'] +INFO - Job 988: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'sbw1o6zCRuC5WN21iDQkTg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:sbw1o6zCRuC5WN21iDQkTg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011228Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011228Z +20221111/us-east-1/s3/aws4_request +ed43d0f5f2615440284ffab1ff9395537a0b438a5ab0234b9709fd58bf4af522 +INFO - '2022-11-11' - botocore.auth - Signature: +00d794a107404b8843914f849a737fafeac0b1ad73f5c5bccb64ae022c26665b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'An2zOxvQ7G+dWHgzvWvABKt6OrtVYBb1mQbl6gsYQu1pFVM8gLXfJIM00GGOuhFy31T8kvpa+Ho=', 'x-amz-request-id': 'C08ZN0RGRX4D0S8Q', 'Date': 'Fri, 11 Nov 2022 01:12:28 GMT', 'ETag': '"b1bc35a3acc246e0b958ddb58834244e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180803T000000, start_date=20221111T011226, end_date=20221111T011229 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:29.524602Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17283421-771d-49d1-a033-73b1c178e768"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..35bd8ca8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:19.214931Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1fdab60b-d339-4525-b71c-2e8cd564ac9e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:19.214931+00:00, try_number=1, job_id=987, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-03 00:00:00+00:00 +INFO - Started process 8277 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-03T00:00:00+00:00', '--job-id', '987', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgis__dhn'] +INFO - Job 987: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011220Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011220Z +20221111/us-east-1/s3/aws4_request +fab908247b4352590fc192e49884b73a30286b6e4e30553fcedc267fe335b3c3 +INFO - '2022-11-11' - botocore.auth - Signature: +0530aac75c1860216be422d4b27cc77b939c1ad1a988eb9f5f21d11e82cc2fe6 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '/pPBgmWQTtynYGaMdmVRaRv9G9b3n15UA+cO+ngF0SnmrJ23ZqoF2D3+b+Dwst435BT/21tIadZLZ7XGNOCQAA==', 'x-amz-request-id': 'W651EVKVWN2C6RK8', 'Date': 'Fri, 11 Nov 2022 01:12:21 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180803T000000, start_date=20221111T011219, end_date=20221111T011222 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:22.411748Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1fdab60b-d339-4525-b71c-2e8cd564ac9e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..dfcc9635 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:11.826365Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a4a1d14-ba4e-4fdc-8f31-80dcd663793d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:11.826365+00:00, try_number=1, job_id=986, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-03 00:00:00+00:00 +INFO - Started process 8272 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-03T00:00:00+00:00', '--job-id', '986', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3esgpwaw'] +INFO - Job 986: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180803T000000, start_date=20221111T011211, end_date=20221111T011224 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:24.091474Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7a4a1d14-ba4e-4fdc-8f31-80dcd663793d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..95e43f3b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-03T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:11.096305Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-03T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3f0e2ab8-027f-3bd8-954e-46a1862978ec"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dc48f0f5-d14e-4d1f-a937-3ca96e3e7c17"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-03T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:11.096305+00:00, try_number=1, job_id=985, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-03 00:00:00+00:00 +INFO - Started process 8269 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-03T00:00:00+00:00', '--job-id', '985', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp82qobouo'] +INFO - Job 985: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-03T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180803T000000, start_date=20221111T011211, end_date=20221111T011214 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-03T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:14.659063Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dc48f0f5-d14e-4d1f-a937-3ca96e3e7c17"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..c1b908a2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:12:36.003386Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26c002f3-918c-451c-aeb7-3ff13d02d38b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:36.003386+00:00, try_number=1, job_id=990, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-04 00:00:00+00:00 +INFO - Started process 8293 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-04T00:00:00+00:00', '--job-id', '990', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq58wc7b7'] +INFO - Job 990: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180804T000000, start_date=20221111T011236, end_date=20221111T011239 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:39.805335Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26c002f3-918c-451c-aeb7-3ff13d02d38b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..31feed8b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:12:36.149352Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6b8979cf-4e1d-477a-aaa3-e44f41a22db9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:36.149352+00:00, try_number=1, job_id=989, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-04 00:00:00+00:00 +INFO - Started process 8296 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-04T00:00:00+00:00', '--job-id', '989', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptvreq6af'] +INFO - Job 989: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180804T000000, start_date=20221111T011236, end_date=20221111T011239 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:39.700241Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6b8979cf-4e1d-477a-aaa3-e44f41a22db9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f0e77808 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:58.377391Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6bb66646-bec8-49ea-b162-d66f9047e995"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:58.377391+00:00, try_number=1, job_id=994, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-04 00:00:00+00:00 +INFO - Started process 8312 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-04T00:00:00+00:00', '--job-id', '994', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp35pkmagv'] +INFO - Job 994: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'sbw1o6zCRuC5WN21iDQkTg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:sbw1o6zCRuC5WN21iDQkTg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011259Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011259Z +20221111/us-east-1/s3/aws4_request +7ba4f3d95aee42ca418457160056ca72fdf6d8290d1854490408289ef41099cf +INFO - '2022-11-11' - botocore.auth - Signature: +d580720221f38b4ddaafa2ffd4d86bb7e571f0ca783722cff4e8bc36dbdb6772 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'nAm/75SAKDhipDHtcCX2N/EMxNcPT5NEc2FI6GWesXidsEqaqDbYM5lJhsX9Q+oiR1qKwd5KsLc=', 'x-amz-request-id': '80TM8TGAYB8K9F3K', 'Date': 'Fri, 11 Nov 2022 01:13:00 GMT', 'ETag': '"b1bc35a3acc246e0b958ddb58834244e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180804T000000, start_date=20221111T011258, end_date=20221111T011301 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:01.726831Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6bb66646-bec8-49ea-b162-d66f9047e995"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5e9972ed --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:48.455037Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e2402439-4882-47f2-9097-0a916650b810"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:48.455037+00:00, try_number=1, job_id=993, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-04 00:00:00+00:00 +INFO - Started process 8168 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-04T00:00:00+00:00', '--job-id', '993', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3sdq0icq'] +INFO - Job 993: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50041f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011249Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011249Z +20221111/us-east-1/s3/aws4_request +8a5b85c8263ca6ce1abef2e03d91ad4e1bb646d5230079e8ab9c397042fe04ec +INFO - '2022-11-11' - botocore.auth - Signature: +79e1853ffeb606dbf79a671a70c5dcf26140d14c188af7e9763ff4f2fcf857b4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'vrC8Rp6NmsQ4sjcIG8wgpr0zpCW6xvwoo0kMu3PlJBa0fVF4Gu7d9H3r4e8X0qF/hPx+gfK41wI=', 'x-amz-request-id': 'NVDTP40NC661QDD2', 'Date': 'Fri, 11 Nov 2022 01:12:50 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180804T000000, start_date=20221111T011248, end_date=20221111T011251 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:51.467888Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e2402439-4882-47f2-9097-0a916650b810"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e2507eff --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:43.964728Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1649e7fc-5736-4f8c-9ed9-65b3b8c2bdc8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:43.964728+00:00, try_number=1, job_id=992, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-04 00:00:00+00:00 +INFO - Started process 8164 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-04T00:00:00+00:00', '--job-id', '992', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr7643gn3'] +INFO - Job 992: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180804T000000, start_date=20221111T011243, end_date=20221111T011254 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:54.256204Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1649e7fc-5736-4f8c-9ed9-65b3b8c2bdc8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f1d02f9c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-04T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:12:42.753709Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-04T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b1f8d54b-bec3-3841-b4e3-69834a849ed5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b7ebd18-c0df-4d64-89f7-e251ba32680f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-04T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:12:42.753709+00:00, try_number=1, job_id=991, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-04 00:00:00+00:00 +INFO - Started process 8302 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-04T00:00:00+00:00', '--job-id', '991', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoih9lasf'] +INFO - Job 991: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-04T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180804T000000, start_date=20221111T011242, end_date=20221111T011245 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-04T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:12:45.757703Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b7ebd18-c0df-4d64-89f7-e251ba32680f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d731e706 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:13:06.618376Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4084439a-deb9-472d-ba7e-a14cede26ac3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:06.618376+00:00, try_number=1, job_id=995, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-05 00:00:00+00:00 +INFO - Started process 8177 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-05T00:00:00+00:00', '--job-id', '995', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvymjae57'] +INFO - Job 995: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180805T000000, start_date=20221111T011306, end_date=20221111T011310 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:10.679985Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4084439a-deb9-472d-ba7e-a14cede26ac3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..f322f9d6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:13:08.097037Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ff6412a5-e8d7-45cd-8dd0-b59f6063ccda"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:08.097037+00:00, try_number=1, job_id=996, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-05 00:00:00+00:00 +INFO - Started process 8180 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-05T00:00:00+00:00', '--job-id', '996', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphszvkhwj'] +INFO - Job 996: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180805T000000, start_date=20221111T011308, end_date=20221111T011312 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:12.300551Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ff6412a5-e8d7-45cd-8dd0-b59f6063ccda"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c6256aa2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:13:31.862386Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9db95f97-2f8b-49d2-a426-e5dd2f0e71da"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:31.862386+00:00, try_number=1, job_id=1000, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-05 00:00:00+00:00 +INFO - Started process 8196 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-05T00:00:00+00:00', '--job-id', '1000', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4i8f9ui_'] +INFO - Job 1000: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa4f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'IXD2ZU/2RcumJsSJiKCQYw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:IXD2ZU/2RcumJsSJiKCQYw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011334Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011334Z +20221111/us-east-1/s3/aws4_request +c8bcbd2a83b318fb3a20efec0b1fc6b33e06e2fc38acb2341df8e95904d55212 +INFO - '2022-11-11' - botocore.auth - Signature: +bee6a9cdb34048fa15c9920d6d80be3a9e7f822c05eb5dad231ea99359027de7 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '/a2krtaqKp9sdeVwNQxUNUbjQj7nFN4p6GaOgG7xSd4dY39fQQmbIJB5w4GZZIMtKtV1rxllLgQ=', 'x-amz-request-id': 'B92ZN1T57BPG3CFG', 'Date': 'Fri, 11 Nov 2022 01:13:35 GMT', 'ETag': '"2170f6654ff645cba626c48988a09063"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180805T000000, start_date=20221111T011331, end_date=20221111T011336 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:36.649802Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9db95f97-2f8b-49d2-a426-e5dd2f0e71da"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f7882d2d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:13:25.750473Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1c63b726-483b-4eaa-a03a-cfa9a1b6e2de"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:25.750473+00:00, try_number=1, job_id=999, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-05 00:00:00+00:00 +INFO - Started process 8323 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-05T00:00:00+00:00', '--job-id', '999', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxts6mbip'] +INFO - Job 999: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249953550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011328Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011328Z +20221111/us-east-1/s3/aws4_request +f91f59c5d8f0b2d807f61f36796e1141eaf6a8ae946c3ea3827ef770639342f0 +INFO - '2022-11-11' - botocore.auth - Signature: +017859ad2e0f4150853e688d2f655c8c9e185062457a80b307057edfe1c5bb6d +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '/HxA1MCX0kzrtwtT9KCL2scU+36DX6CSi4+wuBnLvIs3VhVP7OH7gSlvgMVvW69CQzh1b5mQuKE=', 'x-amz-request-id': '31SR0RZGRXDF8YAE', 'Date': 'Fri, 11 Nov 2022 01:13:29 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180805T000000, start_date=20221111T011325, end_date=20221111T011330 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:30.071940Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1c63b726-483b-4eaa-a03a-cfa9a1b6e2de"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..af56536c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:13:14.089108Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4ce39c52-a556-406a-b180-dd779ea346ea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:14.089108+00:00, try_number=1, job_id=997, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-05 00:00:00+00:00 +INFO - Started process 8319 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-05T00:00:00+00:00', '--job-id', '997', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpua7qvnx_'] +INFO - Job 997: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180805T000000, start_date=20221111T011314, end_date=20221111T011327 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:27.193773Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4ce39c52-a556-406a-b180-dd779ea346ea"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..36978e22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-05T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:13:15.448840Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-05T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "2ce9dc0d-1a08-3177-b5aa-0c018a5fd8f7"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6ad4ccee-415b-47cf-9759-f71649faf8be"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-05T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:15.448840+00:00, try_number=1, job_id=998, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-05 00:00:00+00:00 +INFO - Started process 8186 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-05T00:00:00+00:00', '--job-id', '998', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfumwa739'] +INFO - Job 998: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-05T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180805T000000, start_date=20221111T011315, end_date=20221111T011320 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-05T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:20.163978Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6ad4ccee-415b-47cf-9759-f71649faf8be"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..47396cfd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:13:42.484458Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "61395c01-9972-4a03-b55d-694248092aee"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:42.484458+00:00, try_number=1, job_id=1001, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-06 00:00:00+00:00 +INFO - Started process 8338 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-06T00:00:00+00:00', '--job-id', '1001', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1ddl6sbg'] +INFO - Job 1001: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180806T000000, start_date=20221111T011342, end_date=20221111T011347 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:47.687372Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "61395c01-9972-4a03-b55d-694248092aee"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..874d1110 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:13:42.541170Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e2b69596-240b-403e-9be7-5d7893b58d45"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:42.541170+00:00, try_number=1, job_id=1002, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-06 00:00:00+00:00 +INFO - Started process 8340 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-06T00:00:00+00:00', '--job-id', '1002', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvidg41lp'] +INFO - Job 1002: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180806T000000, start_date=20221111T011342, end_date=20221111T011348 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:48.032850Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e2b69596-240b-403e-9be7-5d7893b58d45"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..5a94aae0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:14:15.715400Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ddfbc639-2e32-4814-a184-086db496ef3b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:15.715400+00:00, try_number=1, job_id=1006, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-06 00:00:00+00:00 +INFO - Started process 8363 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-06T00:00:00+00:00', '--job-id', '1006', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsxmdtlli'] +INFO - Job 1006: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'v0srp6JdtSTHAOwbbIN6Vg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:v0srp6JdtSTHAOwbbIN6Vg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011417Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011417Z +20221111/us-east-1/s3/aws4_request +1e365f0cd0f851ecb455a12f3ba69ccdd53d4d0923bfbd2c88542fbf69e4be49 +INFO - '2022-11-11' - botocore.auth - Signature: +ffee4e4aac67b039d1077e408cbf50c750638de6ab9d4a587bba2b804d7a03dc +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'zDNbkdTiT0+QuaoHxSrNOy4sOa0q25xzSZyAE/5tNKNz0Stql7Ys7Hlr/K+tEwx8Bn6a9jPKG+Y=', 'x-amz-request-id': '1JDKPM0Z786F0YAR', 'Date': 'Fri, 11 Nov 2022 01:14:18 GMT', 'ETag': '"bf4b2ba7a25db524c700ec1b6c837a56"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180806T000000, start_date=20221111T011415, end_date=20221111T011419 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:19.772561Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ddfbc639-2e32-4814-a184-086db496ef3b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..68df436b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:14:03.464880Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2c766584-6bf8-470e-a7c1-4b490bbe0875"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:03.464880+00:00, try_number=1, job_id=1005, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-06 00:00:00+00:00 +INFO - Started process 8355 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-06T00:00:00+00:00', '--job-id', '1005', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjo6yzx9c'] +INFO - Job 1005: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249951550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011405Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011405Z +20221111/us-east-1/s3/aws4_request +a93a3b69381a328d914e737f3d2bec55f782c75cdf678710f4d4a46acdceebb1 +INFO - '2022-11-11' - botocore.auth - Signature: +8699360ffbecf1cdd77322e4fe03f8b2c2c69350b505189629a2e9283342b389 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '0d1GN520X72RLFugp4TqoB17d3sfshZgX8qVFDhb1F9yQDQ3XRQmFeoZh/38Q4boemBdvVaYD5Y=', 'x-amz-request-id': 'DWBGH4TAW986B4CN', 'Date': 'Fri, 11 Nov 2022 01:14:06 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180806T000000, start_date=20221111T011403, end_date=20221111T011407 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:07.517125Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2c766584-6bf8-470e-a7c1-4b490bbe0875"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..7f90bdcc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:13:53.382245Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e1cca47f-99ae-4012-bb64-e1b621dae957"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:53.382245+00:00, try_number=1, job_id=1003, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-06 00:00:00+00:00 +INFO - Started process 8350 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-06T00:00:00+00:00', '--job-id', '1003', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr1d1tpie'] +INFO - Job 1003: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180806T000000, start_date=20221111T011353, end_date=20221111T011411 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:11.732246Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e1cca47f-99ae-4012-bb64-e1b621dae957"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..0e3e7a66 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-06T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:13:53.347768Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-06T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "a7d8269b-06b9-3fed-875a-a1326f6e3532"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d0c9ffa0-8991-45a8-a40d-023e2cda44c4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-06T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:13:53.347768+00:00, try_number=1, job_id=1004, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-06 00:00:00+00:00 +INFO - Started process 8348 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-06T00:00:00+00:00', '--job-id', '1004', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp46npvyeo'] +INFO - Job 1004: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-06T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180806T000000, start_date=20221111T011353, end_date=20221111T011358 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-06T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:13:58.716376Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d0c9ffa0-8991-45a8-a40d-023e2cda44c4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..8774c6ab --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:14:25.386197Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17cbb0e1-bebb-4ea6-a558-9acb9d5a0de0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:25.386197+00:00, try_number=1, job_id=1007, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-07 00:00:00+00:00 +INFO - Started process 8210 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-07T00:00:00+00:00', '--job-id', '1007', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9b2efo4n'] +INFO - Job 1007: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180807T000000, start_date=20221111T011425, end_date=20221111T011430 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:30.517698Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "17cbb0e1-bebb-4ea6-a558-9acb9d5a0de0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2875f935 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:14:25.447792Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85945b18-9e4a-4041-bb42-0d9cdd0d5b8c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:25.447792+00:00, try_number=1, job_id=1008, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-07 00:00:00+00:00 +INFO - Started process 8212 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-07T00:00:00+00:00', '--job-id', '1008', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdowi4rz4'] +INFO - Job 1008: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180807T000000, start_date=20221111T011425, end_date=20221111T011431 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:31.115338Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "85945b18-9e4a-4041-bb42-0d9cdd0d5b8c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..55d72c52 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:14:56.409898Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "767e0cc4-8504-42de-a26c-7eca85015c7e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:56.409898+00:00, try_number=1, job_id=1012, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-07 00:00:00+00:00 +INFO - Started process 8375 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-07T00:00:00+00:00', '--job-id', '1012', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprrht8yfg'] +INFO - Job 1012: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'v0srp6JdtSTHAOwbbIN6Vg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:v0srp6JdtSTHAOwbbIN6Vg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011458Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011458Z +20221111/us-east-1/s3/aws4_request +766b31f1f16faae7a6cbc29d26ffeaf64286a5acf06e12bf24a28a0f0dd87732 +INFO - '2022-11-11' - botocore.auth - Signature: +5b1f7494099af1fb00e180369cd58746d15810df73e2a98c31c70020c226e190 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'uas5OlRsIA7CS3yhmtTd8nAOCwPJeRny8q51qvR3ugh46iWdEAIhgQqYULsnmZi0WgHnsLjwJYk=', 'x-amz-request-id': 'K58HXTDRTS72M7AF', 'Date': 'Fri, 11 Nov 2022 01:14:59 GMT', 'ETag': '"bf4b2ba7a25db524c700ec1b6c837a56"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180807T000000, start_date=20221111T011456, end_date=20221111T011500 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:00.784568Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "767e0cc4-8504-42de-a26c-7eca85015c7e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f8d691bc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:14:43.909645Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "30dfa68c-bd16-4b6f-837d-f8d1a54df0e1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:43.909645+00:00, try_number=1, job_id=1011, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-07 00:00:00+00:00 +INFO - Started process 8227 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-07T00:00:00+00:00', '--job-id', '1011', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpatkq1l3q'] +INFO - Job 1011: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50071f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011446Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011446Z +20221111/us-east-1/s3/aws4_request +0155c9eb45870a87866ea38952b5b88ca7fbcccb06a2f9fc7e38e7288bfb6e15 +INFO - '2022-11-11' - botocore.auth - Signature: +86f0688dbb601f960e31a3a070049ccfe2abdad19a031308db9444d6e6543ff3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'wJBkRADx+kalEcRTI3uWebrSVWUq1LK2qKmdggbKhepsH7soUYBW/dDRYlLvN0BGoixdgYXHCA4=', 'x-amz-request-id': 'BMTT7CJSD1WMCJTQ', 'Date': 'Fri, 11 Nov 2022 01:14:47 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180807T000000, start_date=20221111T011443, end_date=20221111T011448 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:48.418176Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "30dfa68c-bd16-4b6f-837d-f8d1a54df0e1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c6ecdee5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:14:34.694204Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2901cad1-f1b5-46ae-8fdb-55705bc5f8ef"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:34.694204+00:00, try_number=1, job_id=1009, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-07 00:00:00+00:00 +INFO - Started process 8219 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-07T00:00:00+00:00', '--job-id', '1009', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzfg53wg4'] +INFO - Job 1009: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180807T000000, start_date=20221111T011434, end_date=20221111T011451 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:51.271239Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2901cad1-f1b5-46ae-8fdb-55705bc5f8ef"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..394c42d1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-07T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:14:35.180053Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-07T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "187506e6-4e0b-3b9b-97ea-6d085408c21e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c20999b4-7070-4585-b0a1-e7b7005963bd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-07T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:14:35.180053+00:00, try_number=1, job_id=1010, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-07 00:00:00+00:00 +INFO - Started process 8222 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-07T00:00:00+00:00', '--job-id', '1010', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg_9lxfw_'] +INFO - Job 1010: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-07T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180807T000000, start_date=20221111T011435, end_date=20221111T011440 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-07T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:14:40.098389Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c20999b4-7070-4585-b0a1-e7b7005963bd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ced41762 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:15:05.798932Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fb630476-aa79-458d-907a-c45636592cd3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:05.798932+00:00, try_number=1, job_id=1014, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-08 00:00:00+00:00 +INFO - Started process 8386 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-08T00:00:00+00:00', '--job-id', '1014', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbx605gko'] +INFO - Job 1014: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180808T000000, start_date=20221111T011505, end_date=20221111T011510 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:10.122234Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fb630476-aa79-458d-907a-c45636592cd3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..665c71d0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:15:05.672701Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a34a3e3-f0b5-4288-8998-b47ed7191c23"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:05.672701+00:00, try_number=1, job_id=1013, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-08 00:00:00+00:00 +INFO - Started process 8383 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-08T00:00:00+00:00', '--job-id', '1013', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9goy0v3i'] +INFO - Job 1013: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180808T000000, start_date=20221111T011505, end_date=20221111T011510 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:10.859579Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6a34a3e3-f0b5-4288-8998-b47ed7191c23"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..ae330c69 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:15:36.215270Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "34b54e04-5904-465e-842c-a07bb70cdbc4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:36.215270+00:00, try_number=1, job_id=1018, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-08 00:00:00+00:00 +INFO - Started process 8252 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-08T00:00:00+00:00', '--job-id', '1018', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpij1efan2'] +INFO - Job 1018: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'qnmKngo5nvxjR5m5MwK24A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:qnmKngo5nvxjR5m5MwK24A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011538Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011538Z +20221111/us-east-1/s3/aws4_request +9cc887bb270472da5a89d7f0b9b5cbe6d9e95120cc210ec5bfcc6a460bf75d55 +INFO - '2022-11-11' - botocore.auth - Signature: +b3a9fb8bb026ea49c9171eb8a7de6645bab42478ca51f5a33cdb5acfd7ff4c44 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'sn73Gz9qgPMgUBtuWOsYDlWIJhDbR6GWnptOr7i/q+R0AY7aAYkl2Tg7zkrV8W8ifE/1i2Hh2Ac=', 'x-amz-request-id': '5J346HJSA8DCG5QH', 'Date': 'Fri, 11 Nov 2022 01:15:39 GMT', 'ETag': '"aa798a9e0a399efc634799b93302b6e0"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180808T000000, start_date=20221111T011536, end_date=20221111T011539 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:39.954618Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "34b54e04-5904-465e-842c-a07bb70cdbc4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..1728ea53 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:15:25.970548Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e7ecd12-89de-4349-8570-cb3f9f24e71b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:25.970548+00:00, try_number=1, job_id=1017, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-08 00:00:00+00:00 +INFO - Started process 8245 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-08T00:00:00+00:00', '--job-id', '1017', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5_w46br8'] +INFO - Job 1017: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50063a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011528Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011528Z +20221111/us-east-1/s3/aws4_request +144940b2e4fc4a506c82a31d02a64288f167c6c770ef4edee0592bac2e810ac7 +INFO - '2022-11-11' - botocore.auth - Signature: +a8ed6bda5de2fb2adc5abfb6fa61bf708f28a553345f153039cb859ab64bc05c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'OBM7LRu4cFZGD/a6MmpDJBxa3hghRHkJiCMJAUP9qT91ajt9q7tzjhmncLdJHXw00IQSn5rNXoU=', 'x-amz-request-id': '4Q5K7WZFYD00DF40', 'Date': 'Fri, 11 Nov 2022 01:15:28 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180808T000000, start_date=20221111T011525, end_date=20221111T011529 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:29.817874Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6e7ecd12-89de-4349-8570-cb3f9f24e71b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..baed6d81 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:15:15.284585Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "72c09037-b541-45dd-8b4e-19c49ec6cd5c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:15.284585+00:00, try_number=1, job_id=1016, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-08 00:00:00+00:00 +INFO - Started process 8392 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-08T00:00:00+00:00', '--job-id', '1016', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1ocn6owx'] +INFO - Job 1016: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180808T000000, start_date=20221111T011515, end_date=20221111T011531 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:31.539117Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "72c09037-b541-45dd-8b4e-19c49ec6cd5c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..0a1e79a4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-08T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:15:15.224168Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-08T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "0d6bfa69-fd28-33ad-a937-c7581869895f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e8a254b-6d55-46de-b530-b50252c8951d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-08T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:15.224168+00:00, try_number=1, job_id=1015, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-08 00:00:00+00:00 +INFO - Started process 8240 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-08T00:00:00+00:00', '--job-id', '1015', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphixkde0m'] +INFO - Job 1015: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-08T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180808T000000, start_date=20221111T011515, end_date=20221111T011520 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-08T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:20.806177Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e8a254b-6d55-46de-b530-b50252c8951d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..2ff4caa8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:15:46.423873Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "54039585-20b4-45e3-ba3b-2e9858c6f8f0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:46.423873+00:00, try_number=1, job_id=1019, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-09 00:00:00+00:00 +INFO - Started process 8404 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-09T00:00:00+00:00', '--job-id', '1019', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphn385eeo'] +INFO - Job 1019: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180809T000000, start_date=20221111T011546, end_date=20221111T011551 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:51.327201Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "54039585-20b4-45e3-ba3b-2e9858c6f8f0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..70bb88bb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:15:46.473071Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e053132-5942-441f-b995-1629d8a74605"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:46.473071+00:00, try_number=1, job_id=1020, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-09 00:00:00+00:00 +INFO - Started process 8406 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-09T00:00:00+00:00', '--job-id', '1020', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptvdhgauw'] +INFO - Job 1020: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180809T000000, start_date=20221111T011546, end_date=20221111T011551 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:15:51.330354Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0e053132-5942-441f-b995-1629d8a74605"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c734ff97 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:16:20.977275Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "42286867-7388-47a5-a124-d7151abbaaf3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:20.977275+00:00, try_number=1, job_id=1024, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-09 00:00:00+00:00 +INFO - Started process 8434 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-09T00:00:00+00:00', '--job-id', '1024', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprnzkon2h'] +INFO - Job 1024: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'r4B8aA6xD5dZYLnmxlOz5w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:r4B8aA6xD5dZYLnmxlOz5w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011622Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011622Z +20221111/us-east-1/s3/aws4_request +a45c87468f89e8f5df7096d45061cda792a62772513ff64f4925c5cbe2f76e7b +INFO - '2022-11-11' - botocore.auth - Signature: +4b708d1cd86102a599ae04708e584c4dd3fc5f0eee941bcb472b2ce158f002c4 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'dWaEiNmGnaRhuMqV1Z6/s6GH+3WZrl/bVBkl4ZDatAM/GQpFzZtGSBrXLWezuz1o0cIuf+2Gg/Y=', 'x-amz-request-id': 'ZZZ4CNF801J03K19', 'Date': 'Fri, 11 Nov 2022 01:16:23 GMT', 'ETag': '"af807c680eb10f975960b9e6c653b3e7"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180809T000000, start_date=20221111T011620, end_date=20221111T011624 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:24.267246Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "42286867-7388-47a5-a124-d7151abbaaf3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..baef1458 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:16:07.626425Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f56b46e9-c10d-4769-a68e-c79e974d9325"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:07.626425+00:00, try_number=1, job_id=1023, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-09 00:00:00+00:00 +INFO - Started process 8421 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-09T00:00:00+00:00', '--job-id', '1023', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpotc8o0bn'] +INFO - Job 1023: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011609Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011609Z +20221111/us-east-1/s3/aws4_request +2a160a5fe39d2867dc6776d7d9887e1b85d0dcdc227a73fd6e3d22173d216f9f +INFO - '2022-11-11' - botocore.auth - Signature: +a239004f4ab6f946519ca1908fd1d2aaf13f88f348c811978d6387ff9c6ef2c5 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'MkSo1/MxZ+km1DkFDiOjpViSzBygGqjwPln4gekczoJYN2u0UoG1gT2AMm8qr/E9No3nSCuIRhk=', 'x-amz-request-id': 'NM0PJB74WDD52WKN', 'Date': 'Fri, 11 Nov 2022 01:16:09 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180809T000000, start_date=20221111T011607, end_date=20221111T011610 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:10.613646Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f56b46e9-c10d-4769-a68e-c79e974d9325"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..1251a328 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:15:57.257262Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "32b70f85-792d-47cf-9e71-f1dfb6027b0c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:57.257262+00:00, try_number=1, job_id=1022, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-09 00:00:00+00:00 +INFO - Started process 8416 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-09T00:00:00+00:00', '--job-id', '1022', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0tqikx4m'] +INFO - Job 1022: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180809T000000, start_date=20221111T011557, end_date=20221111T011615 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:15.212102Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "32b70f85-792d-47cf-9e71-f1dfb6027b0c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..76a77c4c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-09T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:15:57.074911Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-09T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d5aa7942-e948-36a6-8516-9c12d1af0597"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d1489cab-3a3b-4ba7-8620-26c2424bc838"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-09T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:15:57.074911+00:00, try_number=1, job_id=1021, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-09 00:00:00+00:00 +INFO - Started process 8414 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-09T00:00:00+00:00', '--job-id', '1021', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf5irjlk9'] +INFO - Job 1021: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-09T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180809T000000, start_date=20221111T011557, end_date=20221111T011602 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-09T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:02.059384Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d1489cab-3a3b-4ba7-8620-26c2424bc838"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..b3577c5e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:16:29.841099Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f2606a66-ec1f-414b-829a-38512eebff8c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:29.841099+00:00, try_number=1, job_id=1026, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-10 00:00:00+00:00 +INFO - Started process 8268 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-10T00:00:00+00:00', '--job-id', '1026', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcbbcy9as'] +INFO - Job 1026: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180810T000000, start_date=20221111T011629, end_date=20221111T011635 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:35.002743Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f2606a66-ec1f-414b-829a-38512eebff8c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2acdc628 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:16:29.123519Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fe75b724-ecb4-4128-8621-2691e24df0aa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:29.123519+00:00, try_number=1, job_id=1025, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-10 00:00:00+00:00 +INFO - Started process 8265 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-10T00:00:00+00:00', '--job-id', '1025', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp638ts4i9'] +INFO - Job 1025: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180810T000000, start_date=20221111T011629, end_date=20221111T011634 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:34.509637Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fe75b724-ecb4-4128-8621-2691e24df0aa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..57df953f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:00.884714Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41c467a0-0777-45ad-b42b-31ee84c16df2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:00.884714+00:00, try_number=1, job_id=1030, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-10 00:00:00+00:00 +INFO - Started process 8296 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-10T00:00:00+00:00', '--job-id', '1030', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8phaup0n'] +INFO - Job 1030: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'On0JkIAo3XrzazR0H5cm2A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:On0JkIAo3XrzazR0H5cm2A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011702Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011702Z +20221111/us-east-1/s3/aws4_request +e775e5551a89264f6dc152ff2088dd9ca6b314f0bbec42f1ce4fb687fd89d4ee +INFO - '2022-11-11' - botocore.auth - Signature: +e5fd42940f6e8bfca72f0d47d90957c9fd0ddf4051edbd2c4b53b63d8668e7ed +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'u+o78ao8eEwEEMQ1XXarWtklmsanzP4r4E4iysYyVp9ts1bGhleddNCkhesuDgHp0eMoZFE4RXc=', 'x-amz-request-id': 'YHZTP8WRRNEJCQFW', 'Date': 'Fri, 11 Nov 2022 01:17:03 GMT', 'ETag': '"3a7d09908028dd7af36b34741f9726d8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180810T000000, start_date=20221111T011700, end_date=20221111T011704 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:04.072076Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "41c467a0-0777-45ad-b42b-31ee84c16df2"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..70e46a5d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:16:48.730698Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d43e3868-3089-463f-8335-7e544e7c8250"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:48.730698+00:00, try_number=1, job_id=1029, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-10 00:00:00+00:00 +INFO - Started process 8283 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-10T00:00:00+00:00', '--job-id', '1029', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpuvtn6dku'] +INFO - Job 1029: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50081f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011650Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011650Z +20221111/us-east-1/s3/aws4_request +618c8e5d3555f0db90d475307a83d75c224bf29a196d7ecee4ae1e0e31f52ea9 +INFO - '2022-11-11' - botocore.auth - Signature: +6eb253ba98354497103413aec416d7ed3a67b323fd36c440d53e0d5019d7b127 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'v4vt9lwAyvx8+4xerlLmw2w8d10HRJIqKVOCOh+3tTgV8b1KXGzBOAZSK3PD6NrsRMar81FTPqc=', 'x-amz-request-id': 'KNB4VG9RSP173TV9', 'Date': 'Fri, 11 Nov 2022 01:16:51 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180810T000000, start_date=20221111T011648, end_date=20221111T011652 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:52.730338Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d43e3868-3089-463f-8335-7e544e7c8250"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..1bfb07f7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:16:38.992390Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "43371af6-ab19-4680-9edb-415912aa9b87"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:38.992390+00:00, try_number=1, job_id=1027, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-10 00:00:00+00:00 +INFO - Started process 8275 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-10T00:00:00+00:00', '--job-id', '1027', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbffbjrcf'] +INFO - Job 1027: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180810T000000, start_date=20221111T011638, end_date=20221111T011657 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:57.626997Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "43371af6-ab19-4680-9edb-415912aa9b87"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..defabb2e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-10T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:16:39.798642Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-10T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3179f6be-10a6-3ca0-a90c-2ae51c7dcf10"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab9fc6b7-2a17-4ff1-856b-fcbf23f4af9b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-10T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:16:39.798642+00:00, try_number=1, job_id=1028, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-10 00:00:00+00:00 +INFO - Started process 8278 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-10T00:00:00+00:00', '--job-id', '1028', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjeyckk1m'] +INFO - Job 1028: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-10T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180810T000000, start_date=20221111T011639, end_date=20221111T011644 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-10T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:16:44.479550Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ab9fc6b7-2a17-4ff1-856b-fcbf23f4af9b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..71339298 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:17:08.590974Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0280cd9e-1b7c-4988-b38d-18aa2d13543f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:08.590974+00:00, try_number=1, job_id=1031, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-11 00:00:00+00:00 +INFO - Started process 8304 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-11T00:00:00+00:00', '--job-id', '1031', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0tmwnfc_'] +INFO - Job 1031: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180811T000000, start_date=20221111T011708, end_date=20221111T011713 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:13.142756Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0280cd9e-1b7c-4988-b38d-18aa2d13543f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..3b142c29 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:17:10.219369Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "691fc55f-4b1b-4a57-830d-a281c3ea391a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:10.219369+00:00, try_number=1, job_id=1032, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-11 00:00:00+00:00 +INFO - Started process 8307 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-11T00:00:00+00:00', '--job-id', '1032', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpy4d6n4xi'] +INFO - Job 1032: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180811T000000, start_date=20221111T011710, end_date=20221111T011714 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:14.166935Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "691fc55f-4b1b-4a57-830d-a281c3ea391a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bb14271e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:36.881933Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "625bb6c8-8dde-4436-bf17-c11221b249f5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:36.881933+00:00, try_number=1, job_id=1036, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-11 00:00:00+00:00 +INFO - Started process 8463 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-11T00:00:00+00:00', '--job-id', '1036', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpz7y04c58'] +INFO - Job 1036: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f2ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'LMG+k/+cgY/gKhWdwtvM0g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:LMG+k/+cgY/gKhWdwtvM0g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011739Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011739Z +20221111/us-east-1/s3/aws4_request +67bb7ae2df29a7a1af2315889c081bf15f799e1b3280774bf7c4bd64312d3f8a +INFO - '2022-11-11' - botocore.auth - Signature: +80daba86c676934f9e81bd1cbd91563ff971877a308a6172b9402f7a214c7834 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'M1pI03hozHS/sl/rIDi1tvUcVwoItyLtqzBrMCZX4osL89vXYgPZwiF068V7KZbzvvzBbIYydqE=', 'x-amz-request-id': 'TQPY9T5D47NT5FHZ', 'Date': 'Fri, 11 Nov 2022 01:17:40 GMT', 'ETag': '"2cc1be93ff9c818fe02a159dc2dbccd2"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180811T000000, start_date=20221111T011736, end_date=20221111T011741 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:41.301803Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "625bb6c8-8dde-4436-bf17-c11221b249f5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..86baf46c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:29.082293Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c7b0f3a-9afa-4805-8238-8069799eb642"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:29.082293+00:00, try_number=1, job_id=1035, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-11 00:00:00+00:00 +INFO - Started process 8455 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-11T00:00:00+00:00', '--job-id', '1035', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa_q9in0d'] +INFO - Job 1035: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499521f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011731Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011731Z +20221111/us-east-1/s3/aws4_request +f6967a668a3f5bf508f13aaf4b22c316a484f32b8897723292c43eb23223cbb1 +INFO - '2022-11-11' - botocore.auth - Signature: +379be81696cbd80b1e30d69365a74c1000320e465d2b03dd03625ae43964ad2f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'HWiZKCXVZhef8DYV3CBzksJnQyda+o+FQmW5nBbc6RxtFbFNMs7u4/SRQkR7jY+RulUlM7m3Gcs=', 'x-amz-request-id': 'KM95W40DEFF2PCG0', 'Date': 'Fri, 11 Nov 2022 01:17:31 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180811T000000, start_date=20221111T011729, end_date=20221111T011732 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:32.853320Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c7b0f3a-9afa-4805-8238-8069799eb642"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c3d4025d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:16.277393Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4962447f-4a07-4486-a541-b055b375242c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:16.277393+00:00, try_number=1, job_id=1033, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-11 00:00:00+00:00 +INFO - Started process 8447 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-11T00:00:00+00:00', '--job-id', '1033', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7hl_twze'] +INFO - Job 1033: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180811T000000, start_date=20221111T011716, end_date=20221111T011732 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:32.739448Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4962447f-4a07-4486-a541-b055b375242c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..37d30c32 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-11T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:18.522665Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-11T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "d7ab9931-8b6d-3681-8674-2ecc41954514"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6c24a7b-4179-4e62-b6d9-a821616015e5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-11T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:18.522665+00:00, try_number=1, job_id=1034, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-11 00:00:00+00:00 +INFO - Started process 8450 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-11T00:00:00+00:00', '--job-id', '1034', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7wmlhbfu'] +INFO - Job 1034: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-11T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180811T000000, start_date=20221111T011718, end_date=20221111T011725 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-11T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:25.044118Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f6c24a7b-4179-4e62-b6d9-a821616015e5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..93a28ca7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:17:46.578588Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "da76d18f-bfee-47b3-b65d-90166d8abced"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:46.578588+00:00, try_number=1, job_id=1037, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-12 00:00:00+00:00 +INFO - Started process 8472 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-12T00:00:00+00:00', '--job-id', '1037', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwi28ezna'] +INFO - Job 1037: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180812T000000, start_date=20221111T011746, end_date=20221111T011751 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:51.128510Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "da76d18f-bfee-47b3-b65d-90166d8abced"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..b868f184 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:17:46.614834Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f3c57b8-97fc-438a-9f42-5dc321e774e9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:46.614834+00:00, try_number=1, job_id=1038, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-12 00:00:00+00:00 +INFO - Started process 8474 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-12T00:00:00+00:00', '--job-id', '1038', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm8z7n_ym'] +INFO - Job 1038: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180812T000000, start_date=20221111T011746, end_date=20221111T011751 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:17:51.344207Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f3c57b8-97fc-438a-9f42-5dc321e774e9"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..7538258e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:18:15.319483Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c44187e4-bdc8-452f-9c65-25c1c739e715"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:15.319483+00:00, try_number=1, job_id=1042, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-12 00:00:00+00:00 +INFO - Started process 8490 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-12T00:00:00+00:00', '--job-id', '1042', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpft8jb7cr'] +INFO - Job 1042: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '7oGHBHHsweQebwyzR/esTg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:7oGHBHHsweQebwyzR/esTg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011817Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011817Z +20221111/us-east-1/s3/aws4_request +900d09d4e94df60ab97e04f065841d7fbedfce4ce0fcb81897cffdf0866496ce +INFO - '2022-11-11' - botocore.auth - Signature: +3e55cde6f62d90ecb6f2e81e3e50ede95efe7210d4401d6c35c3a929a60883c3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'lXsixbanqrHG1bm+0U4yCkE7rm3lfYpOvI/bZw1IAiXp5w/BHh17Rqvex4JHbz7gVDGNz77UKkE=', 'x-amz-request-id': 'TZ547PQZKP4YQ1GW', 'Date': 'Fri, 11 Nov 2022 01:18:18 GMT', 'ETag': '"ee81870471ecc1e41e6f0cb347f7ac4e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180812T000000, start_date=20221111T011815, end_date=20221111T011819 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:19.122321Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c44187e4-bdc8-452f-9c65-25c1c739e715"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..4a1a1851 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:18:07.027863Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5277dac8-bdfb-45e9-a4b4-e137c104a403"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:07.027863+00:00, try_number=1, job_id=1041, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-12 00:00:00+00:00 +INFO - Started process 8323 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-12T00:00:00+00:00', '--job-id', '1041', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4snz1ej_'] +INFO - Job 1041: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50083a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011809Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011809Z +20221111/us-east-1/s3/aws4_request +38863155dd8152cb6921f3270176b4a90d1fc50185b566901028fb90ca9267f9 +INFO - '2022-11-11' - botocore.auth - Signature: +2d4850a3e6dfd667843ff3c145fffff0df81e54b273d648f561a8d3ab86adfbe +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UH3q+OS0EUdQMs9LEA8wzYuIyada+PZ3Q3PH4ly2GLN/Jz1sFDd4teDXfeIBxh+bhVlAuQoBFPI=', 'x-amz-request-id': 'MZ5HCH5K74A62DT7', 'Date': 'Fri, 11 Nov 2022 01:18:10 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180812T000000, start_date=20221111T011807, end_date=20221111T011811 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:11.420891Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5277dac8-bdfb-45e9-a4b4-e137c104a403"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..3712473c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:56.494913Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fa113336-76f9-4569-b9f2-e2ecef5fe306"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:56.494913+00:00, try_number=1, job_id=1040, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-12 00:00:00+00:00 +INFO - Started process 8480 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-12T00:00:00+00:00', '--job-id', '1040', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf0tbu5wv'] +INFO - Job 1040: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180812T000000, start_date=20221111T011756, end_date=20221111T011811 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:11.812678Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fa113336-76f9-4569-b9f2-e2ecef5fe306"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..3b8bc322 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-12T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:17:56.353603Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-12T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "598b41f2-63d0-37ba-a3d5-f1e156db120a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "afbc3aa3-6c50-48a2-b305-5530fc22280c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-12T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:17:56.353603+00:00, try_number=1, job_id=1039, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-12 00:00:00+00:00 +INFO - Started process 8318 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-12T00:00:00+00:00', '--job-id', '1039', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpu8kv_smp'] +INFO - Job 1039: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-12T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180812T000000, start_date=20221111T011756, end_date=20221111T011801 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-12T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:01.132599Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "afbc3aa3-6c50-48a2-b305-5530fc22280c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..3a252027 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:18:22.822043Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "054eae19-3567-4c7a-89cc-e1cccecd1000"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:22.822043+00:00, try_number=1, job_id=1043, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-13 00:00:00+00:00 +INFO - Started process 8331 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-13T00:00:00+00:00', '--job-id', '1043', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqmroce44'] +INFO - Job 1043: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180813T000000, start_date=20221111T011822, end_date=20221111T011828 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:28.009217Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "054eae19-3567-4c7a-89cc-e1cccecd1000"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..1c15b4f3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:18:22.912144Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e746c78-3c28-4be1-ad1f-d9212930e22a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:22.912144+00:00, try_number=1, job_id=1044, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-13 00:00:00+00:00 +INFO - Started process 8334 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-13T00:00:00+00:00', '--job-id', '1044', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp8e7ckue4'] +INFO - Job 1044: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180813T000000, start_date=20221111T011822, end_date=20221111T011827 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:27.836168Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8e746c78-3c28-4be1-ad1f-d9212930e22a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f6d7e7bf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:18:53.647163Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8eae342-6a04-4b90-aece-750e2bf5edc9"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:53.647163+00:00, try_number=1, job_id=1048, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-13 00:00:00+00:00 +INFO - Started process 8519 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-13T00:00:00+00:00', '--job-id', '1048', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcv9fgepa'] +INFO - Job 1048: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GVUGtJ/Ijtllnm4m9syzmw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GVUGtJ/Ijtllnm4m9syzmw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011855Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011855Z +20221111/us-east-1/s3/aws4_request +2f33ea29dc49a396b9e39ee2338fb88eed76469b38031deca9fd896f0039309d +INFO - '2022-11-11' - botocore.auth - Signature: +bf03b7877eed7d18adc2a631326ec2a0b30d1723e63e31dd99668d3efa2285ef +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'BYq5PsPsvu0+AQeZWOvLNrEdSU9mEZtIT2CFESgvmcVxyoDgW2R12lzgXGbeqJfxUgGL122aFSw=', 'x-amz-request-id': 'Q5YQ6GHHE71N5S8Z', 'Date': 'Fri, 11 Nov 2022 01:18:55 GMT', 'ETag': '"195506b49fc88ed9659e6e26f6ccb39b"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180813T000000, start_date=20221111T011853, end_date=20221111T011856 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:56.686672Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8eae342-6a04-4b90-aece-750e2bf5edc9"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..f9b39415 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:18:42.363960Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2c17f268-c350-49f9-ac08-cf7e5a985eef"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:42.363960+00:00, try_number=1, job_id=1047, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-13 00:00:00+00:00 +INFO - Started process 8506 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-13T00:00:00+00:00', '--job-id', '1047', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpzwrx2rxe'] +INFO - Job 1047: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499523a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011845Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011845Z +20221111/us-east-1/s3/aws4_request +cc01214b50723faefaad46d65a15649682094753143a1e33c0ba9f4e9625861c +INFO - '2022-11-11' - botocore.auth - Signature: +8e35eeb149e6fc24366b77cdb418b4df3bccff8c4cc4f5e25c466c0cabe9babd +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': '3UK27uIXZV5pD+dWMiyyC9YkEC0SxxguO4EDJVV7Pd6RiF2vmtHAEZaySD/MoPy9N42uoWrWKyk=', 'x-amz-request-id': 'R2YX45WP4ZP11V1A', 'Date': 'Fri, 11 Nov 2022 01:18:45 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180813T000000, start_date=20221111T011842, end_date=20221111T011846 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:46.702626Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2c17f268-c350-49f9-ac08-cf7e5a985eef"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6ec5ed26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:18:33.827846Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f956c9ae-0bd9-46a8-b108-ae2f194c5d1c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:33.827846+00:00, try_number=1, job_id=1046, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-13 00:00:00+00:00 +INFO - Started process 8501 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-13T00:00:00+00:00', '--job-id', '1046', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmg746mtg'] +INFO - Job 1046: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180813T000000, start_date=20221111T011833, end_date=20221111T011848 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:48.630669Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f956c9ae-0bd9-46a8-b108-ae2f194c5d1c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..ff847794 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-13T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:18:32.524678Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-13T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51199c50-abfc-393e-97cd-4cf94f66dabc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "091ad3e8-0262-4f06-863b-89a16a998db4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-13T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:18:32.524678+00:00, try_number=1, job_id=1045, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-13 00:00:00+00:00 +INFO - Started process 8498 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-13T00:00:00+00:00', '--job-id', '1045', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg9qblmg6'] +INFO - Job 1045: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-13T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180813T000000, start_date=20221111T011832, end_date=20221111T011836 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-13T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:18:36.718941Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "091ad3e8-0262-4f06-863b-89a16a998db4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..7a2cd582 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:19:02.428979Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4986243c-4535-4a43-99e9-53753e25571f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:02.428979+00:00, try_number=1, job_id=1050, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-14 00:00:00+00:00 +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-14T00:00:00+00:00', '--job-id', '1050', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpvo1oxarp'] +INFO - Started process 8349 to run task +INFO - Job 1050: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180814T000000, start_date=20221111T011902, end_date=20221111T011906 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:06.774089Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4986243c-4535-4a43-99e9-53753e25571f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..682b45ea --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:19:00.736243Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "898b0af8-d553-43c8-a2f3-809a512fcbc1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:00.736243+00:00, try_number=1, job_id=1049, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-14 00:00:00+00:00 +INFO - Started process 8346 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-14T00:00:00+00:00', '--job-id', '1049', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbg4o6_i1'] +INFO - Job 1049: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180814T000000, start_date=20221111T011900, end_date=20221111T011905 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:05.646750Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "898b0af8-d553-43c8-a2f3-809a512fcbc1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..9152d1ea --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:33.630033Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a16adc79-0053-4282-91b5-ff4fb1bb8a0b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:33.630033+00:00, try_number=1, job_id=1054, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-14 00:00:00+00:00 +INFO - Started process 8533 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-14T00:00:00+00:00', '--job-id', '1054', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpg3xuw9eo'] +INFO - Job 1054: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1f70> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GVUGtJ/Ijtllnm4m9syzmw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GVUGtJ/Ijtllnm4m9syzmw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011935Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011935Z +20221111/us-east-1/s3/aws4_request +fe4a414cffc9ca94fc4e942a91fff39a6ade57bbb5b1a3f78476285485e6cc34 +INFO - '2022-11-11' - botocore.auth - Signature: +937a1e2c85d52c9f6701a420612f9ed7aafbe09436c5930c0f3c0dba69a0473c +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'FjoLpvNZNezrAJX+7Ot3Sa2v1C9OZJIZ8LoOUBAgAgAeNUjP1VUkiHAjh+AABNH4tjDrhbN+0lU=', 'x-amz-request-id': '30S9J8RW2182SBSK', 'Date': 'Fri, 11 Nov 2022 01:19:36 GMT', 'ETag': '"195506b49fc88ed9659e6e26f6ccb39b"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180814T000000, start_date=20221111T011933, end_date=20221111T011936 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:36.977173Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a16adc79-0053-4282-91b5-ff4fb1bb8a0b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..422a88ab --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:19.452710Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb46e639-f077-4824-a3d4-eebdf4a142b3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:19.452710+00:00, try_number=1, job_id=1053, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-14 00:00:00+00:00 +INFO - Started process 8526 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-14T00:00:00+00:00', '--job-id', '1053', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6nh166cz'] +INFO - Job 1053: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T011921Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T011921Z +20221111/us-east-1/s3/aws4_request +a63de57b8425a93ae7f6710fa550610248c89e1373990251a3dc7835659c0830 +INFO - '2022-11-11' - botocore.auth - Signature: +0b3e54e84199ecd89e5e439495adb1bbe55937af0b54954124714867491c610b +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mN32uVip7QWD8EyygwtYSPaQid/i0YZSyc5w4Yl2OCt2AVxaNZEmEczDQYcXw4tCZ5sPNf4P1tk=', 'x-amz-request-id': 'SJK021KZDNRMQDR7', 'Date': 'Fri, 11 Nov 2022 01:19:22 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180814T000000, start_date=20221111T011919, end_date=20221111T011923 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:23.381826Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb46e639-f077-4824-a3d4-eebdf4a142b3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..2a85b1ed --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:12.639531Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0f5c3e33-b1c5-45ed-8c53-c6675dcf0a07"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:12.639531+00:00, try_number=1, job_id=1052, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-14 00:00:00+00:00 +INFO - Started process 8359 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-14T00:00:00+00:00', '--job-id', '1052', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3aomyv7g'] +INFO - Job 1052: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180814T000000, start_date=20221111T011912, end_date=20221111T011929 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:29.878975Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0f5c3e33-b1c5-45ed-8c53-c6675dcf0a07"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..eb36389c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-14T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:09.866958Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-14T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "51bd91ad-f02f-3ff9-9fc7-3959cfd3e75c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae3aaa5e-d338-44c2-9621-2c9f654b7fbf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-14T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:09.866958+00:00, try_number=1, job_id=1051, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-14 00:00:00+00:00 +INFO - Started process 8356 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-14T00:00:00+00:00', '--job-id', '1051', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwsddt3kf'] +INFO - Job 1051: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-14T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180814T000000, start_date=20221111T011909, end_date=20221111T011914 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-14T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:14.968727Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ae3aaa5e-d338-44c2-9621-2c9f654b7fbf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..9e735cae --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:19:42.564314Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "adfd5002-6988-4f13-af89-4070a3ac5d41"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:42.564314+00:00, try_number=1, job_id=1056, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-15 00:00:00+00:00 +INFO - Started process 8374 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-15T00:00:00+00:00', '--job-id', '1056', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4vjarbkj'] +INFO - Job 1056: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180815T000000, start_date=20221111T011942, end_date=20221111T011947 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:47.065320Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "adfd5002-6988-4f13-af89-4070a3ac5d41"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..1cfd005b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:19:41.841317Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2ace1962-5617-4b92-8f54-067cacbf7dbd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:41.841317+00:00, try_number=1, job_id=1055, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-15 00:00:00+00:00 +INFO - Started process 8371 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-15T00:00:00+00:00', '--job-id', '1055', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3lcnmzth'] +INFO - Job 1055: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180815T000000, start_date=20221111T011941, end_date=20221111T011946 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:46.020942Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2ace1962-5617-4b92-8f54-067cacbf7dbd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c903abd4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:20:10.446955Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ad56cb1a-106f-4db0-b5cc-9c4e151db187"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:10.446955+00:00, try_number=1, job_id=1060, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-15 00:00:00+00:00 +INFO - Started process 8557 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-15T00:00:00+00:00', '--job-id', '1060', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpva_83n0f'] +INFO - Job 1060: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f1ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'GVUGtJ/Ijtllnm4m9syzmw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:GVUGtJ/Ijtllnm4m9syzmw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012012Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012012Z +20221111/us-east-1/s3/aws4_request +c1b0d87580af2843a43301a9956573f18a1c5d9f6f94c479dc65709a71f176af +INFO - '2022-11-11' - botocore.auth - Signature: +30ac1a454d91341cadfce63d913483f95f25901fbdcc3f41de602a1a81c16aa8 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'Uxx1LrMosue8KT6ZoSrnmrkWeguuHpdqWz3jSCYC739WSCHAx/gcX57bxcVs1HfOgKsfKp/loKE=', 'x-amz-request-id': '1PSW7MDP1NM2KM72', 'Date': 'Fri, 11 Nov 2022 01:20:13 GMT', 'ETag': '"195506b49fc88ed9659e6e26f6ccb39b"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180815T000000, start_date=20221111T012010, end_date=20221111T012014 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:14.807586Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ad56cb1a-106f-4db0-b5cc-9c4e151db187"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..ee427637 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:57.711385Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6ee11ff3-d719-407b-9090-085a4f0b5354"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:57.711385+00:00, try_number=1, job_id=1059, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-15 00:00:00+00:00 +INFO - Started process 8550 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-15T00:00:00+00:00', '--job-id', '1059', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0f267y5m'] +INFO - Job 1059: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012000Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012000Z +20221111/us-east-1/s3/aws4_request +72f053b06c0638477eba93cf044d05917bbd342ebf9a4e4923b6697a5f21836f +INFO - '2022-11-11' - botocore.auth - Signature: +eda6cef123681efe52c7ae6246e93ca3570c9fb8a6c9fe3f01da2022aee91351 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'bOeAUR0dwvB5BjObKkB6VcCDAx7ndEr+w2LTUgdKOhEupqoaf6AXz/gv/Yip1A6I6Yi7FtfsPSc=', 'x-amz-request-id': 'KBQD67R38YJPRDCT', 'Date': 'Fri, 11 Nov 2022 01:20:01 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180815T000000, start_date=20221111T011957, end_date=20221111T012002 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:02.093796Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6ee11ff3-d719-407b-9090-085a4f0b5354"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..9bc7e4d4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:50.525543Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c4bd2711-e00d-42c9-a4bc-4808a509aabf"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:50.525543+00:00, try_number=1, job_id=1058, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-15 00:00:00+00:00 +INFO - Started process 8380 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-15T00:00:00+00:00', '--job-id', '1058', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpkee07d9e'] +INFO - Job 1058: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180815T000000, start_date=20221111T011950, end_date=20221111T012006 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:06.561308Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c4bd2711-e00d-42c9-a4bc-4808a509aabf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..b7577915 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-15T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:19:50.076972Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-15T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "67269ee8-192c-31fe-98bc-7c91ccdb93fa"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "be8dd757-c82d-4462-9d09-fa3224a2f319"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-15T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:19:50.076972+00:00, try_number=1, job_id=1057, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-15 00:00:00+00:00 +INFO - Started process 8545 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-15T00:00:00+00:00', '--job-id', '1057', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1rxoptkk'] +INFO - Job 1057: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-15T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180815T000000, start_date=20221111T011950, end_date=20221111T011953 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-15T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:19:53.934065Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "be8dd757-c82d-4462-9d09-fa3224a2f319"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..4aff753d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:20:19.295195Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c36ae84-201b-4c05-aeef-59a23b57f144"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:19.295195+00:00, try_number=1, job_id=1061, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-16 00:00:00+00:00 +INFO - Started process 8387 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-16T00:00:00+00:00', '--job-id', '1061', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpar41_65r'] +INFO - Job 1061: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180816T000000, start_date=20221111T012019, end_date=20221111T012023 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:23.705016Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c36ae84-201b-4c05-aeef-59a23b57f144"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..287d83af --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:20:19.316391Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2330567c-bcc2-4596-9a07-4201fef11c9c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:19.316391+00:00, try_number=1, job_id=1062, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-16 00:00:00+00:00 +INFO - Started process 8389 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-16T00:00:00+00:00', '--job-id', '1062', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbc_m9_69'] +INFO - Job 1062: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180816T000000, start_date=20221111T012019, end_date=20221111T012024 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:24.123948Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2330567c-bcc2-4596-9a07-4201fef11c9c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..bbee10fd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:20:45.909821Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ccd9134f-b23d-4ba7-bd89-d9717be8a61b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:45.909821+00:00, try_number=1, job_id=1066, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-16 00:00:00+00:00 +INFO - Started process 8407 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-16T00:00:00+00:00', '--job-id', '1066', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpubn87aj4'] +INFO - Job 1066: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5ca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '34BfETy+VmJG5fM68O+HFQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:34BfETy+VmJG5fM68O+HFQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012047Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012047Z +20221111/us-east-1/s3/aws4_request +060bd371d08532d0a29bafa2069a460a27e53e69ad163a48a8af9b990a240181 +INFO - '2022-11-11' - botocore.auth - Signature: +ce31cbc438928ba5619e357b61d9097b81a479f79fdf97d9b61adbc3547d89f9 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'jV08g8KAZmzi2G4GwYnxftialKee6chYvkHIRofQKFDU94R5knIVRp8uk70Cml/t/9CFH+sLh+w=', 'x-amz-request-id': 'M9HYM7AMS0TQ5TQH', 'Date': 'Fri, 11 Nov 2022 01:20:48 GMT', 'ETag': '"df805f113cbe566246e5f33af0ef8715"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180816T000000, start_date=20221111T012045, end_date=20221111T012049 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:49.277767Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ccd9134f-b23d-4ba7-bd89-d9717be8a61b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..59dd8533 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:20:38.954536Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "035abadb-e387-468e-97d2-96727d252eab"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:38.954536+00:00, try_number=1, job_id=1065, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-16 00:00:00+00:00 +INFO - Started process 8400 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-16T00:00:00+00:00', '--job-id', '1065', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6688o67l'] +INFO - Job 1065: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f50073a0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012040Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012040Z +20221111/us-east-1/s3/aws4_request +711e2f6ad7e8f09c8383dcdf0312c99d148f69cea14fe4ad6571a14c6ba1708c +INFO - '2022-11-11' - botocore.auth - Signature: +bde8dfe3fbce96c64ebded9970dfca6769ffdc051b2f08d1c1acb0d9fed2075a +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'K2Fo2+FCYGICJzmnEsX76tHMHRhBfRJL/Pdt7Pgj0/FJrj3ojckr+bldiEEmResiwprZAvKsMq0=', 'x-amz-request-id': 'FE1KG29P6153QA5T', 'Date': 'Fri, 11 Nov 2022 01:20:41 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180816T000000, start_date=20221111T012038, end_date=20221111T012042 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:42.674906Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "035abadb-e387-468e-97d2-96727d252eab"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..7c57fc48 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:20:29.197952Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d20ba48-06f9-446c-89c9-69a5a8f44e25"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:29.197952+00:00, try_number=1, job_id=1063, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-16 00:00:00+00:00 +INFO - Started process 8566 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-16T00:00:00+00:00', '--job-id', '1063', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0i1i7g2h'] +INFO - Job 1063: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180816T000000, start_date=20221111T012029, end_date=20221111T012042 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:42.674608Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8d20ba48-06f9-446c-89c9-69a5a8f44e25"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..cd6f9d08 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-16T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:20:29.226084Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-16T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "b6b7f9b3-3a56-363e-ac73-64f48b9bfd6f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e63f07f-f360-4ee5-9b7a-6fe544a79b42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-16T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:29.226084+00:00, try_number=1, job_id=1064, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-16 00:00:00+00:00 +INFO - Started process 8568 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-16T00:00:00+00:00', '--job-id', '1064', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0fwvci38'] +INFO - Job 1064: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-16T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180816T000000, start_date=20221111T012029, end_date=20221111T012035 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-16T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:35.020041Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e63f07f-f360-4ee5-9b7a-6fe544a79b42"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..f9cacaf4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:20:53.114725Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "312879ed-6009-497d-936a-69fe52cc170f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:53.114725+00:00, try_number=1, job_id=1067, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-17 00:00:00+00:00 +INFO - Started process 8416 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-17T00:00:00+00:00', '--job-id', '1067', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3shp0nsw'] +INFO - Job 1067: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180817T000000, start_date=20221111T012053, end_date=20221111T012057 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:57.939693Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "312879ed-6009-497d-936a-69fe52cc170f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..a293ebce --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:20:53.215400Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f505ad1f-35d7-4cce-ae7e-428cd4d240d1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:20:53.215400+00:00, try_number=1, job_id=1068, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-17 00:00:00+00:00 +INFO - Started process 8418 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-17T00:00:00+00:00', '--job-id', '1068', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpn2higo3w'] +INFO - Job 1068: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180817T000000, start_date=20221111T012053, end_date=20221111T012058 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:20:58.321369Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f505ad1f-35d7-4cce-ae7e-428cd4d240d1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..127abccf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:18.726706Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e3adb39-4abf-433d-87a2-d59906ccff08"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:18.726706+00:00, try_number=1, job_id=1072, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-17 00:00:00+00:00 +INFO - Started process 8586 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-17T00:00:00+00:00', '--job-id', '1072', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp5vxtyzvy'] +INFO - Job 1072: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BD8lD/cN0nuJUY16HgrlBA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:BD8lD/cN0nuJUY16HgrlBA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012120Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012120Z +20221111/us-east-1/s3/aws4_request +263c33a10729f1ff153466bdb0bea194a39b42368ff3c601e293b14c08588443 +INFO - '2022-11-11' - botocore.auth - Signature: +dc2ddb93efbf6da8566034d5337f84ff7838f18c43dd4ae1cdac1e84076738ad +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'OSpi1x9lmefDse/SSwYPuSFc/S7mYr4jedWf52J4kEL6rLA/WUrC5hedEvUDfY4wtjuqp8ErJjE=', 'x-amz-request-id': 'X1A6NKGTGVZFCJKS', 'Date': 'Fri, 11 Nov 2022 01:21:21 GMT', 'ETag': '"043f250ff70dd27b89518d7a1e0ae504"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180817T000000, start_date=20221111T012118, end_date=20221111T012122 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:22.712024Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e3adb39-4abf-433d-87a2-d59906ccff08"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..d31e1f55 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:11.159851Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a691c769-2c43-4343-bf13-b116dbe7bfc1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:11.159851+00:00, try_number=1, job_id=1071, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-17 00:00:00+00:00 +INFO - Started process 8579 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-17T00:00:00+00:00', '--job-id', '1071', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps23h33t_'] +INFO - Job 1071: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249952550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012113Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012113Z +20221111/us-east-1/s3/aws4_request +c07bea4812f24f6e49b079eb88fa77ffebece4788c69be61684abbf5c4f799f3 +INFO - '2022-11-11' - botocore.auth - Signature: +901e8d7b994321057bbd059106a2ad670b4d2c974aedf420aa8fc61f84064f68 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'IHx65wT1oofNT7USxDm+UtZg5ZqMHeYtVI8eHX8Bp4jiyCgyQ9XwiUh015tzFGlJ70noepE7T0A=', 'x-amz-request-id': 'NPPAHBA3ETET0B16', 'Date': 'Fri, 11 Nov 2022 01:21:14 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180817T000000, start_date=20221111T012111, end_date=20221111T012114 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:14.847318Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a691c769-2c43-4343-bf13-b116dbe7bfc1"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..a805c8c9 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:00.786984Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d61c6365-c5f4-4476-814c-188bfc95b467"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:00.786984+00:00, try_number=1, job_id=1069, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-17 00:00:00+00:00 +INFO - Started process 8425 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-17T00:00:00+00:00', '--job-id', '1069', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx1fbk53d'] +INFO - Job 1069: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180817T000000, start_date=20221111T012100, end_date=20221111T012115 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:15.536612Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d61c6365-c5f4-4476-814c-188bfc95b467"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..27733778 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-17T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:01.331662Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-17T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "ef81cc49-1bc1-3568-a57d-66f34035deea"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dee970ce-3bf0-4aa9-b153-46a1daf46541"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-17T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:01.331662+00:00, try_number=1, job_id=1070, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-17 00:00:00+00:00 +INFO - Started process 8428 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-17T00:00:00+00:00', '--job-id', '1070', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpp1avcmdp'] +INFO - Job 1070: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-17T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180817T000000, start_date=20221111T012101, end_date=20221111T012106 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-17T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:06.922383Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "dee970ce-3bf0-4aa9-b153-46a1daf46541"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..ad6cd3db --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:21:26.051739Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a61b07a6-f02c-4cc8-92f1-9309b9b75855"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:26.051739+00:00, try_number=1, job_id=1074, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-18 00:00:00+00:00 +INFO - Started process 8441 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-18T00:00:00+00:00', '--job-id', '1074', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0jjxww4m'] +INFO - Job 1074: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180818T000000, start_date=20221111T012126, end_date=20221111T012130 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:30.527480Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a61b07a6-f02c-4cc8-92f1-9309b9b75855"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..f1fa8d64 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:21:26.095532Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6bce5f4-aed1-4a5f-866e-96828ec46562"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:26.095532+00:00, try_number=1, job_id=1073, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-18 00:00:00+00:00 +INFO - Started process 8443 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-18T00:00:00+00:00', '--job-id', '1073', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmt2hk1os'] +INFO - Job 1073: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180818T000000, start_date=20221111T012126, end_date=20221111T012130 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:30.539381Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a6bce5f4-aed1-4a5f-866e-96828ec46562"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..f1ab946d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:52.701032Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "077dfb04-c9e9-4b76-98d3-9ef1e4caa249"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:52.701032+00:00, try_number=1, job_id=1078, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-18 00:00:00+00:00 +INFO - Started process 8615 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-18T00:00:00+00:00', '--job-id', '1078', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpesahpyta'] +INFO - Job 1078: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '6KwOXMV47/QsC84rFXF39w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:6KwOXMV47/QsC84rFXF39w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012155Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012155Z +20221111/us-east-1/s3/aws4_request +03cf2292f0f3adf514e8abe4fa6be32cb30553f45755e36c75f012d94665aba7 +INFO - '2022-11-11' - botocore.auth - Signature: +fc8f89c7a2f65beb3161015940d53e83cdd18e656df7971cbc7f29b57cfe9812 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'HK8lyaryx/IOaV0hRfFHyl3XrbXjN3TCDyvnzN7jObDtznAMjk8e2Vgbz1fFUYWKnraBwOHiCL3XUiwgobkrjA==', 'x-amz-request-id': 'SJZHQDAVV7AE4SMQ', 'Date': 'Fri, 11 Nov 2022 01:21:56 GMT', 'ETag': '"e8ac0e5cc578eff42c0bce2b157177f7"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180818T000000, start_date=20221111T012152, end_date=20221111T012157 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:57.008237Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "077dfb04-c9e9-4b76-98d3-9ef1e4caa249"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..c3ae7bba --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:43.577361Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "60d0f555-4c8c-474d-9c80-1d6a9624ff45"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:43.577361+00:00, try_number=1, job_id=1077, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-18 00:00:00+00:00 +INFO - Started process 8607 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-18T00:00:00+00:00', '--job-id', '1077', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph82bv838'] +INFO - Job 1077: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012146Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012146Z +20221111/us-east-1/s3/aws4_request +571d4ccd5b7f5efa76742357acafb9765ce7dfe4a0c008994a4a0304bc2cf40d +INFO - '2022-11-11' - botocore.auth - Signature: +9b81b25689c885d0e14aa627fe458e58f6a2ad4b0a68fd56ac47a2a37b26f730 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'qzOmEU4ZDLsJQhpRaNUlG1DiPE0uGpWUoUoOTNbwXfi71Ff58OkQPaL5RNqpmVvHT3PLZRMfEo8=', 'x-amz-request-id': '4BHGB1QM44RM8T92', 'Date': 'Fri, 11 Nov 2022 01:21:47 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180818T000000, start_date=20221111T012143, end_date=20221111T012148 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:48.498601Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "60d0f555-4c8c-474d-9c80-1d6a9624ff45"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..69cb37e1 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:33.958532Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "794d8e48-bfce-4413-bbf4-6e136e42fd36"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:33.958532+00:00, try_number=1, job_id=1076, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-18 00:00:00+00:00 +INFO - Started process 8602 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-18T00:00:00+00:00', '--job-id', '1076', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpss6hg4yd'] +INFO - Job 1076: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180818T000000, start_date=20221111T012133, end_date=20221111T012148 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:48.644405Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "794d8e48-bfce-4413-bbf4-6e136e42fd36"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..399d5156 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-18T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:21:33.933904Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-18T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "840b1a35-bd97-3d78-a012-558eb355f9e8"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "72b5fb24-5064-41f5-9fab-c405852e7660"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-18T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:21:33.933904+00:00, try_number=1, job_id=1075, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-18 00:00:00+00:00 +INFO - Started process 8599 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-18T00:00:00+00:00', '--job-id', '1075', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphf7zp8h5'] +INFO - Job 1075: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-18T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180818T000000, start_date=20221111T012133, end_date=20221111T012138 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-18T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:21:38.098962Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "72b5fb24-5064-41f5-9fab-c405852e7660"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..89379c31 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:22:01.049066Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c64b9269-0a96-49bb-b541-ffec48f45a25"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:01.049066+00:00, try_number=1, job_id=1079, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-19 00:00:00+00:00 +INFO - Started process 8626 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-19T00:00:00+00:00', '--job-id', '1079', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpie6t4h78'] +INFO - Job 1079: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180819T000000, start_date=20221111T012201, end_date=20221111T012205 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:05.765323Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c64b9269-0a96-49bb-b541-ffec48f45a25"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..0e547065 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:22:01.038380Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4f7af0f0-e3fc-41fa-be89-340c23607b7d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:01.038380+00:00, try_number=1, job_id=1080, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-19 00:00:00+00:00 +INFO - Started process 8624 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-19T00:00:00+00:00', '--job-id', '1080', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0lvekbk7'] +INFO - Job 1080: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180819T000000, start_date=20221111T012201, end_date=20221111T012205 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:05.735457Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4f7af0f0-e3fc-41fa-be89-340c23607b7d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..956156f2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:29.600742Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ec27e953-2081-4124-a056-bf911c9e0e53"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:29.600742+00:00, try_number=1, job_id=1084, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-19 00:00:00+00:00 +INFO - Started process 8642 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-19T00:00:00+00:00', '--job-id', '1084', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7huobfg0'] +INFO - Job 1084: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498efca0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '6KwOXMV47/QsC84rFXF39w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:6KwOXMV47/QsC84rFXF39w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012231Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012231Z +20221111/us-east-1/s3/aws4_request +9986825be4e350b8aaa4ccd4b2baae130e190aed78564533e90d11eeff4390eb +INFO - '2022-11-11' - botocore.auth - Signature: +f3dee5353c4ea92faf5b0a483f67389033894686595db92a080949594fd08f97 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'wWKCdUDUpvUngCgsNn3rB4RMM4wA6o/rB+qQPu72aBlNwfKXYui/KdF5i6pSv3PcGeuKi6JbMlc=', 'x-amz-request-id': '246MPEQX09YQ5D01', 'Date': 'Fri, 11 Nov 2022 01:22:32 GMT', 'ETag': '"e8ac0e5cc578eff42c0bce2b157177f7"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180819T000000, start_date=20221111T012229, end_date=20221111T012233 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:33.274845Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ec27e953-2081-4124-a056-bf911c9e0e53"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..79312518 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:18.736365Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db07df3e-77f2-4fac-a62d-80686b4bbfac"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:18.736365+00:00, try_number=1, job_id=1083, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-19 00:00:00+00:00 +INFO - Started process 8458 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-19T00:00:00+00:00', '--job-id', '1083', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj5feaf97'] +INFO - Job 1083: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f5006550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012222Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012222Z +20221111/us-east-1/s3/aws4_request +7e664efd5609af1c8a447d128e45bd14a7acb785c77467699a919987f47c74b6 +INFO - '2022-11-11' - botocore.auth - Signature: +0c02526c185aaf534b47a4ad83daacc56e2d55fcd882a9755337ce63b4fa4108 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'obVTF+ydF7aNFIqSsMDKuHMKdbozTJP+LVq3X5nM34xgnsENx8fWoM9omOcYloMMqGZ7ANPaPdw=', 'x-amz-request-id': 'V4SVQ8ZWH2GZ9SS5', 'Date': 'Fri, 11 Nov 2022 01:22:23 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180819T000000, start_date=20221111T012218, end_date=20221111T012224 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:24.937600Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db07df3e-77f2-4fac-a62d-80686b4bbfac"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..c7e9ef4f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:10.530644Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d8a7d354-157c-45f5-a890-2221c7c4a187"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:10.530644+00:00, try_number=1, job_id=1081, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-19 00:00:00+00:00 +INFO - Started process 8449 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-19T00:00:00+00:00', '--job-id', '1081', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3cdkpufn'] +INFO - Job 1081: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180819T000000, start_date=20221111T012210, end_date=20221111T012225 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:25.530410Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d8a7d354-157c-45f5-a890-2221c7c4a187"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..f46f9bf5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-19T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:10.664580Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-19T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "757b5a3f-c9c8-3c83-8aa6-119f2c923177"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "181882a4-6cfc-49fb-82c1-dd4566cb66c8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-19T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:10.664580+00:00, try_number=1, job_id=1082, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-19 00:00:00+00:00 +INFO - Started process 8632 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-19T00:00:00+00:00', '--job-id', '1082', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcim54g03'] +INFO - Job 1082: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-19T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180819T000000, start_date=20221111T012210, end_date=20221111T012214 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-19T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:14.689998Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "181882a4-6cfc-49fb-82c1-dd4566cb66c8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..2382ec31 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:22:37.760265Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cc495ba8-7ba7-4825-95ac-f53349574c61"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:37.760265+00:00, try_number=1, job_id=1085, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-20 00:00:00+00:00 +INFO - Started process 8467 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-20T00:00:00+00:00', '--job-id', '1085', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpr9bvnh53'] +INFO - Job 1085: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180820T000000, start_date=20221111T012237, end_date=20221111T012241 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:41.887928Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cc495ba8-7ba7-4825-95ac-f53349574c61"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..3f5299fc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:22:37.793485Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c66b98ba-85b2-4cc7-a507-0d705b6090a5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:37.793485+00:00, try_number=1, job_id=1086, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-20 00:00:00+00:00 +INFO - Started process 8470 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-20T00:00:00+00:00', '--job-id', '1086', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw6lfu8_x'] +INFO - Job 1086: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180820T000000, start_date=20221111T012237, end_date=20221111T012242 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:42.645008Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c66b98ba-85b2-4cc7-a507-0d705b6090a5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..e33a1787 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:23:06.092355Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c1697e7d-82de-444e-81a8-9822e8dce643"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:06.092355+00:00, try_number=1, job_id=1090, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-20 00:00:00+00:00 +INFO - Started process 8661 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-20T00:00:00+00:00', '--job-id', '1090', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx7u1atcd'] +INFO - Job 1090: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62498f0940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '6KwOXMV47/QsC84rFXF39w==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:6KwOXMV47/QsC84rFXF39w== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012307Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012307Z +20221111/us-east-1/s3/aws4_request +7db51e231b70d9b52e50d0c6996ce3b0730bb1dbc695564f4e5c969f148fa054 +INFO - '2022-11-11' - botocore.auth - Signature: +1eccf73e2cd47d10b31077ae3deba7f8a989069d045e806b1c82672bf1335547 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'tYSDcsN5KjOqjxDO/7jP6+7TibVehlL61+uxHL4ctUOf/bZHQEEp9joRqSKNDvvQefLZhLNk9q4=', 'x-amz-request-id': 'VBB52PRPZF9EG521', 'Date': 'Fri, 11 Nov 2022 01:23:08 GMT', 'ETag': '"e8ac0e5cc578eff42c0bce2b157177f7"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180820T000000, start_date=20221111T012306, end_date=20221111T012308 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:08.966830Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c1697e7d-82de-444e-81a8-9822e8dce643"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..6f269acd --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:58.214112Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58f8ea3b-f225-461b-9b47-50e16518e226"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:58.214112+00:00, try_number=1, job_id=1089, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-20 00:00:00+00:00 +INFO - Started process 8654 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-20T00:00:00+00:00', '--job-id', '1089', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbdti_u85'] +INFO - Job 1089: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f6249954550> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012300Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012300Z +20221111/us-east-1/s3/aws4_request +7fe5f08c28d7bd6a7bca45beda77a5eb3d57f42dda9ddb3935a5457292bac480 +INFO - '2022-11-11' - botocore.auth - Signature: +74b0f06191cabf0d05620df2753503fa76ddfd740b48e88c824e1ee67d2c3bed +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'mLUT0DxbMKrcyr3NF4PM631vTNchUavqDCRegzXgmRl6mQjzDg1oITLTZb6//jxKXa4G3JQ5sH0nLpVe6tBhjw==', 'x-amz-request-id': 'HN2G9ERABEH62EHP', 'Date': 'Fri, 11 Nov 2022 01:23:00 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180820T000000, start_date=20221111T012258, end_date=20221111T012301 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:01.828098Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "58f8ea3b-f225-461b-9b47-50e16518e226"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..6f6fd894 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:46.725893Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "56e36f08-1c3d-4def-831a-752ddd6a2950"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:46.725893+00:00, try_number=1, job_id=1087, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-20 00:00:00+00:00 +INFO - Started process 8476 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-20T00:00:00+00:00', '--job-id', '1087', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpew_8q3z1'] +INFO - Job 1087: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180820T000000, start_date=20221111T012246, end_date=20221111T012301 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:01.869162Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "56e36f08-1c3d-4def-831a-752ddd6a2950"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..99b02d22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-20T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:22:47.691442Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-20T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "343900a7-0b28-3b6e-987f-a5c234706613"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1519b673-8cb3-40d0-b235-79a53e30bde6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-20T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:22:47.691442+00:00, try_number=1, job_id=1088, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-20 00:00:00+00:00 +INFO - Started process 8649 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-20T00:00:00+00:00', '--job-id', '1088', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpbkkjgwfb'] +INFO - Job 1088: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-20T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180820T000000, start_date=20221111T012247, end_date=20221111T012252 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-20T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:22:52.826708Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1519b673-8cb3-40d0-b235-79a53e30bde6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..92be99f0 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:23:14.245453Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a127df5d-171c-465d-b55b-3adba753989a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:14.245453+00:00, try_number=1, job_id=1091, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-21 00:00:00+00:00 +INFO - Started process 8488 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-21T00:00:00+00:00', '--job-id', '1091', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3s879xbk'] +INFO - Job 1091: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180821T000000, start_date=20221111T012314, end_date=20221111T012318 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:18.927490Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a127df5d-171c-465d-b55b-3adba753989a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..2bd865c7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:23:14.511276Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f2fccf72-4bb3-4222-9c4f-1a2c13a2ab42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:14.511276+00:00, try_number=1, job_id=1092, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-21 00:00:00+00:00 +INFO - Started process 8490 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-21T00:00:00+00:00', '--job-id', '1092', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwp2y545_'] +INFO - Job 1092: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180821T000000, start_date=20221111T012314, end_date=20221111T012318 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:18.930151Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f2fccf72-4bb3-4222-9c4f-1a2c13a2ab42"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c8b4dd20 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:23:48.977247Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "887b41e6-30d0-4b0c-85ab-011842ef71e5"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:48.977247+00:00, try_number=1, job_id=1096, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-21 00:00:00+00:00 +INFO - Started process 8496 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-21T00:00:00+00:00', '--job-id', '1096', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpio3iuzu1'] +INFO - Job 1096: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa6ee0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'flX8mrQqB2AhjRuoQiGGgQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:flX8mrQqB2AhjRuoQiGGgQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012352Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012352Z +20221111/us-east-1/s3/aws4_request +2cad67d441650d70dbe7af28204791c78d93da9463a9b41b53460cf8229843f0 +INFO - '2022-11-11' - botocore.auth - Signature: +62d311d29c463e641031149d3c27d132ecd4dae1a9715d1b90a40de72cb93e8f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'evpif+k9i4DJqtngTuLI6l/lOzpV3FMb7ubS2Y++PkXxKu2QsvioEGsawPWU57mJYzWkSBwuqu4=', 'x-amz-request-id': 'P34E1NGWFS87RWSJ', 'Date': 'Fri, 11 Nov 2022 01:23:52 GMT', 'ETag': '"7e55fc9ab42a0760218d1ba842218681"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180821T000000, start_date=20221111T012348, end_date=20221111T012353 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:53.830060Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "887b41e6-30d0-4b0c-85ab-011842ef71e5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..64725066 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:23:34.197767Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f819392-2cef-4808-9332-b749a712817e"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:34.197767+00:00, try_number=1, job_id=1095, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-21 00:00:00+00:00 +INFO - Started process 8682 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-21T00:00:00+00:00', '--job-id', '1095', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpf4lhrlr3'] +INFO - Job 1095: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f62499511f0> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012336Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012336Z +20221111/us-east-1/s3/aws4_request +e9e10288e599c8e89d3828782d24fcf3b6d47fdea17cd3b9e5da1a7a868377e0 +INFO - '2022-11-11' - botocore.auth - Signature: +93258b24c75dbdf5f55cdc6a2d2e3615eb2e112ed007722df7405911cabf27a3 +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'UypG/evVh+t0GtEUu+tZK9wsJ4nGPVozK/Whl2Pc/XXJkCO4wLo935R1z/d//T2RxqWqDP6nV58=', 'x-amz-request-id': 'ZCTQHF6JVD0H2A2E', 'Date': 'Fri, 11 Nov 2022 01:23:37 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B2, execution_date=20180821T000000, start_date=20221111T012334, end_date=20221111T012338 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:38.314310Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1f819392-2cef-4808-9332-b749a712817e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..f00415b6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:23:23.203309Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9d2ffcd-cc4a-4ff1-b76a-a4bb9c7e5f4d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:23.203309+00:00, try_number=1, job_id=1093, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-21 00:00:00+00:00 +INFO - Started process 8674 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-21T00:00:00+00:00', '--job-id', '1093', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmph8j_8cw6'] +INFO - Job 1093: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180821T000000, start_date=20221111T012323, end_date=20221111T012343 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:43.315084Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9d2ffcd-cc4a-4ff1-b76a-a4bb9c7e5f4d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..7883b798 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-21T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:23:23.298798Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-21T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "08f4d622-d951-3a47-a0cc-adaab0209cda"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d5136835-448f-4259-b575-5064439e964a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-21T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:23.298798+00:00, try_number=1, job_id=1094, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-21 00:00:00+00:00 +INFO - Started process 8677 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-21T00:00:00+00:00', '--job-id', '1094', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9rnzh6k6'] +INFO - Job 1094: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-21T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180821T000000, start_date=20221111T012323, end_date=20221111T012329 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-21T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:23:29.498214Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d5136835-448f-4259-b575-5064439e964a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..89ddd407 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:23:58.938055Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "52c4a2ae-d938-4af7-82c6-e37b50a6e55f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:58.938055+00:00, try_number=1, job_id=1098, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-22 00:00:00+00:00 +INFO - Started process 8693 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-22T00:00:00+00:00', '--job-id', '1098', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_8kyyges'] +INFO - Job 1098: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNComahue_dag_elt - universidad carrera ... codigo_postal correo_electronico +0 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN PSICOLOGÍA ... 5315 FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE FARMACIA ... 8305 TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 3428 RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE MEDICINA ... 5873 ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE LICENCIATURA EN CIENCIA POLÍTICA ... 1765 FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180822T000000, start_date=20221111T012358, end_date=20221111T012403 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:24:03.737463Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": 
{"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "52c4a2ae-d938-4af7-82c6-e37b50a6e55f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..17c9e8e4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all 
met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-11T01:23:58.945483Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": 
"default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, 
"do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "caed49c8-4b5c-474e-80cf-c2167439f3f2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:23:58.945483+00:00, try_number=1, job_id=1097, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-22 00:00:00+00:00 +INFO - Started process 8694 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-22T00:00:00+00:00', '--job-id', '1097', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6clt61_c'] +INFO - Job 1097: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180822T000000, start_date=20221111T012358, end_date=20221111T012403 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:24:03.488898Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "caed49c8-4b5c-474e-80cf-c2167439f3f2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..d2cb5a9f --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,122 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:24:22.729044Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "585c4da8-b519-4d63-b1b0-862e6faa9395"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:24:22.729044+00:00, try_number=1, job_id=1101, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-22 00:00:00+00:00 +INFO - Started process 8508 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-22T00:00:00+00:00', '--job-id', '1101', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfxe4ippx'] +INFO - Job 1101: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1a42983a4dbb +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-11' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-11' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-11' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-11' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-11' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-11' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fe2f4fa5940> +INFO - '2022-11-11' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-11' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-11' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-11' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-11' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 
'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-11' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-11' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-11' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'flX8mrQqB2AhjRuoQiGGgQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-11' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-11' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-11' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-11' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:flX8mrQqB2AhjRuoQiGGgQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221111T012423Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-11' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221111T012423Z +20221111/us-east-1/s3/aws4_request +760b431f55f37930e3a23b841189fba37bce40c81493913c4d05947221b0c998 +INFO - '2022-11-11' - botocore.auth - Signature: +84f8f7e2634d98ae5dd1e37ed24bd73ad03b6a4f6e0a11ffb86bfbb78e56947f +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.endpoint - Sending http request: +INFO - '2022-11-11' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-11' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-11' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-11' - botocore.parsers - Response headers: {'x-amz-id-2': 'aSigNoUbsjD5OtW35B2pucyCIbGwtvMio0mETPZt0nsfctPBxS9BnAgzXzeieLuHrxH7KXtIu+BqcqmeNsxFjg==', 'x-amz-request-id': 'FXG9VYK8FVYGZDCW', 'Date': 'Fri, 11 Nov 2022 01:24:24 GMT', 'ETag': '"7e55fc9ab42a0760218d1ba842218681"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-11' - botocore.parsers - Response body: +b'' +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-11' - botocore.retryhandler - No retry needed. +INFO - '2022-11-11' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-11' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Load_B1, execution_date=20180822T000000, start_date=20221111T012422, end_date=20221111T012425 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 
'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:24:25.522168Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "585c4da8-b519-4d63-b1b0-862e6faa9395"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..b1103ed5 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,36 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:24:08.319638Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cfd41760-915e-480a-a0b5-2d63e4a6f701"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:24:08.319638+00:00, try_number=1, job_id=1099, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-22 00:00:00+00:00 +INFO - Started process 8709 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-22T00:00:00+00:00', '--job-id', '1099', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpw4p_ni5_'] +INFO - Job 1099: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180822T000000, start_date=20221111T012408, end_date=20221111T012420 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 
'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:24:20.292938Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", 
"retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cfd41760-915e-480a-a0b5-2d63e4a6f701"}} diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..137119d2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-22T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-11T01:24:08.343873Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-22T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8fd50a34-ae45-3c50-a327-6ebfc346834e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63db2723-fd3f-4e26-922f-165de71bf9d7"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-22T00:00:00+00:00, map_index=-1, run_start_date=2022-11-11 01:24:08.343873+00:00, try_number=1, job_id=1100, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-22 00:00:00+00:00 +INFO - Started process 8707 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-22T00:00:00+00:00', '--job-id', '1100', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1qfz4q15'] +INFO - Job 1100: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 5bee9a49f133 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-22T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-11' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-11' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-11' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180822T000000, start_date=20221111T012408, end_date=20221111T012412 +INFO - '2022-11-11' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-11' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-11' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-22T00:00:00+00:00 +INFO - '2022-11-11' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-11' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-11' - openlineage.client.transport.console - {"eventTime": "2022-11-11T01:24:12.881263Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "63db2723-fd3f-4e26-922f-165de71bf9d7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d3782e34 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:17:18.161870Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e4b23aaf-86de-4d7e-8461-4b162180ed8a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:17:18.161870+00:00, try_number=1, job_id=1105, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 177 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1105', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpgn9dnmk_'] +INFO - Job 1105: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180823T000000, start_date=20221112T231718, end_date=20221112T231722 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:17:22.746356Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e4b23aaf-86de-4d7e-8461-4b162180ed8a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..fc00cb00 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:17:17.465871Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ca6081e6-9ad5-4415-bfda-b0be23e6bbb1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:17:17.465871+00:00, try_number=1, job_id=1104, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 174 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1104', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmps42kdzbu'] +INFO - Job 1104: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180823T000000, start_date=20221112T231717, end_date=20221112T231722 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:17:22.724195Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ca6081e6-9ad5-4415-bfda-b0be23e6bbb1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..59a5b6a8 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:17:39.053900Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "62ca286a-f8c2-42b4-b887-50980b509c88"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:17:39.053900+00:00, try_number=1, job_id=1109, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 201 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1109', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1i3xdue1'] +INFO - Job 1109: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d2f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180823T000000, start_date=20221112T231739, end_date=20221112T231740 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1109 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 201) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" new file mode 100644 index 00000000..ed72f289 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:22:44.647556Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d1187c3-883d-46c2-88b9-d3b76b9708bc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:22:44.647556+00:00, try_number=2, job_id=1117, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 273 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1117', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpemt8e5me'] +INFO - Job 1117: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ef5e0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180823T000000, start_date=20221112T232244, end_date=20221112T232246 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:22:46.472134Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d1187c3-883d-46c2-88b9-d3b76b9708bc"}} +ERROR - Failed to execute job 1117 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 273) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..0b9a0670 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:17:35.372265Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "732477c2-bc0c-438f-83e7-dea26806564a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:17:35.372265+00:00, try_number=1, job_id=1108, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 194 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1108', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpmhqo314g'] +INFO - Job 1108: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1a60> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180823T000000, start_date=20221112T231735, end_date=20221112T231737 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1108 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 194) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" new file mode 100644 index 00000000..7eed5bc3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:22:43.876755Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d4e20e99-2741-4286-86d8-be287ddac366"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:22:43.876755+00:00, try_number=2, job_id=1116, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 270 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1116', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpa2rq7h1u'] +INFO - Job 1116: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180823T000000, start_date=20221112T232243, end_date=20221112T232246 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:22:46.204924Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d4e20e99-2741-4286-86d8-be287ddac366"}} +ERROR - Failed to execute job 1116 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 270) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..3c3c9185 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:17:26.166543Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a34b37cf-e153-40e2-b2d5-d85aa63a8746"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:17:26.166543+00:00, try_number=1, job_id=1106, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 184 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1106', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpx1r2ousi'] +INFO - Job 1106: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the 
old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180823T000000, start_date=20221112T231726, end_date=20221112T231736 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:17:36.515925Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": 
"<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a34b37cf-e153-40e2-b2d5-d85aa63a8746"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..1b5453b4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-23T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:17:26.852480Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-23T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "3fe9b6d3-6ce0-3bdd-af73-3c9cec1e4170"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f17cc75-c8f8-4a71-a3e7-de38c0f2468b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-23T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:17:26.852480+00:00, try_number=1, job_id=1107, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-23 00:00:00+00:00 +INFO - Started process 187 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-23T00:00:00+00:00', '--job-id', '1107', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq2sf195k'] +INFO - Job 1107: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-23T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180823T000000, start_date=20221112T231726, end_date=20221112T231731 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-23T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:17:31.939581Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9f17cc75-c8f8-4a71-a3e7-de38c0f2468b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..d7cabeaa --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:22:49.754927Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1759a536-cb44-4dd2-a009-8823a0746c35"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:22:49.754927+00:00, try_number=1, job_id=1119, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 287 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1119', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpfa9rvlrp'] +INFO - Job 1119: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180824T000000, start_date=20221112T232249, end_date=20221112T232255 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:22:55.252879Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1759a536-cb44-4dd2-a009-8823a0746c35"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..17151024 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:22:49.602368Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "596ad4d3-801b-4030-a8df-93526282a0a1"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:22:49.602368+00:00, try_number=1, job_id=1118, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 285 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1118', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpsfxbrsfj'] +INFO - Job 1118: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180824T000000, start_date=20221112T232249, end_date=20221112T232255 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:22:55.209060Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "596ad4d3-801b-4030-a8df-93526282a0a1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..925977b7 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:23:18.154715Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5fb4a972-5249-4015-ad24-b328a0496460"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:23:18.154715+00:00, try_number=1, job_id=1123, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 314 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1123', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3rbvjtov'] +INFO - Job 1123: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ee0d0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180824T000000, start_date=20221112T232318, end_date=20221112T232319 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1123 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 314) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" new file mode 100644 index 00000000..15d9a3c2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:21.838759Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f520a7b8-d8d4-405c-a825-c143ada5b835"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:21.838759+00:00, try_number=2, job_id=1125, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 357 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1125', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp56dgi_sw'] +INFO - Job 1125: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1ee0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180824T000000, start_date=20221112T232821, end_date=20221112T232822 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:28:22.901940Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f520a7b8-d8d4-405c-a825-c143ada5b835"}} +ERROR - Failed to execute job 1125 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 357) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..e1168f14 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:23:06.965841Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f4fc1b68-563a-46bb-8467-f943aadd076f"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:23:06.965841+00:00, try_number=1, job_id=1122, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 302 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1122', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpjwc49sjv'] +INFO - Job 1122: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770cff70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180824T000000, start_date=20221112T232306, end_date=20221112T232308 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1122 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 302) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" new file mode 100644 index 00000000..b338430e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:10.657455Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "16e54322-a501-43ec-83eb-ff9f85e0fb81"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:10.657455+00:00, try_number=2, job_id=1124, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 345 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1124', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptvfc5rdz'] +INFO - Job 1124: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ef5e0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180824T000000, start_date=20221112T232810, end_date=20221112T232811 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:28:11.842853Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "16e54322-a501-43ec-83eb-ff9f85e0fb81"}} +ERROR - Failed to execute job 1124 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 345) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..d0177a61 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:23:00.070985Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c1785497-5766-42df-8709-afa840fc8edd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:23:00.070985+00:00, try_number=1, job_id=1121, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 297 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1121', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_5hd9yvd'] +INFO - Job 1121: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the 
old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180824T000000, start_date=20221112T232300, end_date=20221112T232311 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:23:11.937493Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": 
"<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c1785497-5766-42df-8709-afa840fc8edd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..7edc7a7c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-24T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:22:59.437983Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-24T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "173e8b50-ba0d-38d5-abb3-9123afb23846"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b23db31-4467-4a79-930c-8244e36036e3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-24T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:22:59.437983+00:00, try_number=1, job_id=1120, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-24 00:00:00+00:00 +INFO - Started process 294 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-24T00:00:00+00:00', '--job-id', '1120', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpt6l0i0wh'] +INFO - Job 1120: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-24T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180824T000000, start_date=20221112T232259, end_date=20221112T232303 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-24T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:23:03.983681Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b23db31-4467-4a79-930c-8244e36036e3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..1573dd23 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:26.468382Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51cbd137-0f3d-46ad-9fc2-837612f87416"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:26.468382+00:00, try_number=1, job_id=1127, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 368 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1127', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp98vt1ovz'] +INFO - Job 1127: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180825T000000, start_date=20221112T232826, end_date=20221112T232830 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:28:30.321478Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51cbd137-0f3d-46ad-9fc2-837612f87416"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..340d61fb --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:26.330740Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4ac78111-4759-4de5-a7db-24668eba1152"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:26.330740+00:00, try_number=1, job_id=1126, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 366 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1126', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpoeam_zmq'] +INFO - Job 1126: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180825T000000, start_date=20221112T232826, end_date=20221112T232830 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:28:30.265945Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4ac78111-4759-4de5-a7db-24668eba1152"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..7d7df25d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:28:46.593575Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aa514a36-84ec-4965-a036-7e97e763c47b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:46.593575+00:00, try_number=1, job_id=1131, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 390 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1131', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpks5wvoup'] +INFO - Job 1131: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ef550> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180825T000000, start_date=20221112T232846, end_date=20221112T232848 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1131 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 390) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" new file mode 100644 index 00000000..980ba27c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:33:52.515112Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5b0f9738-e489-4638-8d14-b67caf71f4bc"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:33:52.515112+00:00, try_number=2, job_id=1135, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 445 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1135', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpj3fg0c5w'] +INFO - Job 1135: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d3f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180825T000000, start_date=20221112T233352, end_date=20221112T233353 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:33:53.999643Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5b0f9738-e489-4638-8d14-b67caf71f4bc"}} +ERROR - Failed to execute job 1135 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 445) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..9a95ef5d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:42.091777Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c819c3db-24b7-4ea3-bff6-45d1986a5686"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:42.091777+00:00, try_number=1, job_id=1130, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 383 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1130', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpeumig50j'] +INFO - Job 1130: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ef0d0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180825T000000, start_date=20221112T232842, end_date=20221112T232843 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1130 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 383) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" new file mode 100644 index 00000000..807883ac --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:33:46.222964Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c5a95d1c-e412-4f82-835c-31da809c37ef"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:33:46.222964+00:00, try_number=2, job_id=1134, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 438 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1134', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpo7axys3f'] +INFO - Job 1134: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180825T000000, start_date=20221112T233346, end_date=20221112T233347 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:33:47.590935Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c5a95d1c-e412-4f82-835c-31da809c37ef"}} +ERROR - Failed to execute job 1134 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 438) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..8c504482 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:34.058229Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "212d1635-35dc-4f55-8abe-99371133eacd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:34.058229+00:00, try_number=1, job_id=1128, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 375 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1128', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmphwpglh8a'] +INFO - Job 1128: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the 
old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180825T000000, start_date=20221112T232834, end_date=20221112T232844 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:28:44.504618Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": 
"<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "212d1635-35dc-4f55-8abe-99371133eacd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..01933319 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-25T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:28:34.560248Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-25T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "05dd5574-fd22-3ae6-bc46-49b16db334f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "461093a9-9526-43ec-95d7-76882f4c5aea"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-25T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:28:34.560248+00:00, try_number=1, job_id=1129, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-25 00:00:00+00:00 +INFO - Started process 378 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-25T00:00:00+00:00', '--job-id', '1129', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq5pqnfuz'] +INFO - Job 1129: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-25T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180825T000000, start_date=20221112T232834, end_date=20221112T232839 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-25T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:28:39.206297Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "461093a9-9526-43ec-95d7-76882f4c5aea"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..715d3ea2 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:33:58.652591Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b2646924-120c-4342-b753-20a07893281d"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:33:58.652591+00:00, try_number=1, job_id=1137, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 456 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1137', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpyoe0xavm'] +INFO - Job 1137: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180826T000000, start_date=20221112T233358, end_date=20221112T233403 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:34:03.052855Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b2646924-120c-4342-b753-20a07893281d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..e5c19f4c --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:33:58.448379Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d44238a-fdc7-4ef5-8310-a7572d63c8a6"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:33:58.448379+00:00, try_number=1, job_id=1136, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 453 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1136', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3hvg069p'] +INFO - Job 1136: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180826T000000, start_date=20221112T233358, end_date=20221112T233403 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:34:03.051374Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "4d44238a-fdc7-4ef5-8310-a7572d63c8a6"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..c6d3d1ed --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:34:27.311718Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a07cc8ee-8bf3-42e8-b864-787ad2367d4b"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:34:27.311718+00:00, try_number=1, job_id=1141, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 483 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1141', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp6qvq5m89'] +INFO - Job 1141: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180826T000000, start_date=20221112T233427, end_date=20221112T233428 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1141 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 483) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" new file mode 100644 index 00000000..9db92c8e --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:31.621508Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49218617-def4-4013-bc08-8bdbf50e8302"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:31.621508+00:00, try_number=2, job_id=1145, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 538 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1145', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpi6wy7wi8'] +INFO - Job 1145: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770f05e0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180826T000000, start_date=20221112T233931, end_date=20221112T233932 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:39:32.484900Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "49218617-def4-4013-bc08-8bdbf50e8302"}} +ERROR - Failed to execute job 1145 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 538) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..5a01766a --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:34:20.027435Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3e29d51e-dfeb-4398-bc33-21dc91048122"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:34:20.027435+00:00, try_number=1, job_id=1140, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 476 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1140', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_c46_4np'] +INFO - Job 1140: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ef0d0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180826T000000, start_date=20221112T233420, end_date=20221112T233422 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1140 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 476) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" new file mode 100644 index 00000000..5d5e6faf --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:25.091630Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9951a901-4ad1-465d-b358-5e4d37794dd4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:25.091630+00:00, try_number=2, job_id=1144, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 526 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1144', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpedgu50n5'] +INFO - Job 1144: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ed5e0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180826T000000, start_date=20221112T233925, end_date=20221112T233925 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:39:25.918670Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9951a901-4ad1-465d-b358-5e4d37794dd4"}} +ERROR - Failed to execute job 1144 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 526) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..e8c31d57 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:34:06.970050Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "332339da-af72-445c-bdf1-440c5fe97f28"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:34:06.970050+00:00, try_number=1, job_id=1138, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 463 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1138', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpq34x381c'] +INFO - Job 1138: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the 
old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180826T000000, start_date=20221112T233406, end_date=20221112T233423 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:34:23.668135Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": 
"<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "332339da-af72-445c-bdf1-440c5fe97f28"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..a995d754 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-26T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:34:09.284506Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-26T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "9e50f0c4-461d-3e66-8272-6e9840458f4a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22a727ec-d51e-43d9-8bbd-61e327d9b3c2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-26T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:34:09.284506+00:00, try_number=1, job_id=1139, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-26 00:00:00+00:00 +INFO - Started process 466 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-26T00:00:00+00:00', '--job-id', '1139', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1trskllp'] +INFO - Job 1139: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-26T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180826T000000, start_date=20221112T233409, end_date=20221112T233416 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-26T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:34:16.411480Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "22a727ec-d51e-43d9-8bbd-61e327d9b3c2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..bc9d561d --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:37.622199Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2662734c-a4a3-46d7-b13a-b7eb931e3cbd"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:37.622199+00:00, try_number=1, job_id=1147, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 549 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1147', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1jojq62t'] +INFO - Job 1147: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180827T000000, start_date=20221112T233937, end_date=20221112T233941 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:39:41.406655Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2662734c-a4a3-46d7-b13a-b7eb931e3cbd"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..89a226af --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:36.920616Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74184f44-aaec-403a-ab93-ffe35c2c76f4"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:36.920616+00:00, try_number=1, job_id=1146, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 546 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1146', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmprnmasfbq'] +INFO - Job 1146: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180827T000000, start_date=20221112T233936, end_date=20221112T233940 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:39:40.965602Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "74184f44-aaec-403a-ab93-ffe35c2c76f4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..91b379b4 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:40:04.422682Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d4302924-e3a2-487c-9c04-4a6e10e35829"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:40:04.422682+00:00, try_number=1, job_id=1151, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 571 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1151', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmptgwx6xqf'] +INFO - Job 1151: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d0f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180827T000000, start_date=20221112T234004, end_date=20221112T234006 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1151 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 571) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" new file mode 100644 index 00000000..2097ed22 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:45:09.056151Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "503d99e6-bf66-4e34-8b60-68b6b7b97b08"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:09.056151+00:00, try_number=2, job_id=1153, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 614 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1153', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpm754de53'] +INFO - Job 1153: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180827T000000, start_date=20221112T234509, end_date=20221112T234510 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B1 airflow_run_id=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B1: TaskMetadata(name='ETL_dag.Load_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B1'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:45:10.041642Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "503d99e6-bf66-4e34-8b60-68b6b7b97b08"}} +ERROR - Failed to execute job 1153 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 614) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..bdd422e6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:52.702927Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0f6f9dbd-6d6f-4ec2-95a0-f7ac59e30c42"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:52.702927+00:00, try_number=1, job_id=1150, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 564 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1150', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_t6h_f8t'] +INFO - Job 1150: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d0f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180827T000000, start_date=20221112T233952, end_date=20221112T233954 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1150 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 564) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" new file mode 100644 index 00000000..ccdd0c26 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=2.log" @@ -0,0 +1,262 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:44:57.754392Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "56d0c059-ec56-4ec8-a557-623cab10ade8"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:44:57.754392+00:00, try_number=2, job_id=1152, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 607 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1152', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpxxlyyct7'] +INFO - Job 1152: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d1ee0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as FAILED. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180827T000000, start_date=20221112T234457, end_date=20221112T234459 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance failure +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Load_B2 airflow_run_id=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Load_B2: TaskMetadata(name='ETL_dag.Load_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': 
{'task_id': 'Load_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Load_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Transform_B2'}, 'downstream_task_ids': set(), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:44:59.159772Z", "eventType": "FAIL", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "56d0c059-ec56-4ec8-a557-623cab10ade8"}} +ERROR - Failed to execute job 1152 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 607) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..80a561fc --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:44.184508Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "94b56f6a-52a2-42dc-a0e9-b04f2b412fc3"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:44.184508+00:00, try_number=1, job_id=1149, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 559 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1149', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdpgvryjn'] +INFO - Job 1149: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the 
old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180827T000000, start_date=20221112T233944, end_date=20221112T234000 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:40:00.580413Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": 
"<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "94b56f6a-52a2-42dc-a0e9-b04f2b412fc3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..2262ba19 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-27T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:39:44.124366Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-27T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "8d5c998e-957d-3f58-bef5-b68759af1048"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26f6738d-73e3-45b7-878a-58936fa8185a"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-27T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:39:44.124366+00:00, try_number=1, job_id=1148, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-27 00:00:00+00:00 +INFO - Started process 557 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-27T00:00:00+00:00', '--job-id', '1148', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpv057artm'] +INFO - Job 1148: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-27T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180827T000000, start_date=20221112T233944, end_date=20221112T233949 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-27T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:39:49.382042Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "26f6738d-73e3-45b7-878a-58936fa8185a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" new file mode 100644 index 00000000..bf06fac3 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B1/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:45:14.852160Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", 
"task_group": "", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": 
"<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b30d24e0-3cc4-459a-86af-95025dfef6e2"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B1, dagrun_id=scheduled__2018-08-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:14.852160+00:00, try_number=1, job_id=1155, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-28 00:00:00+00:00 +INFO - Started process 625 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B1', 'scheduled__2018-08-28T00:00:00+00:00', '--job-id', '1155', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpwraguso9'] +INFO - Job 1155: Subtask Extract_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Extract_B1, execution_date=20180828T000000, start_date=20221112T234514, end_date=20221112T234518 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B1 airflow_run_id=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B1: TaskMetadata(name='ETL_dag.Extract_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 
'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:45:18.941891Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b30d24e0-3cc4-459a-86af-95025dfef6e2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" new file mode 100644 index 00000000..736fb508 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Extract_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 
+INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:45:14.435479Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Transform_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, 
"ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "37022b0f-3e57-4d27-b5a2-d9c903c349aa"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Extract_B2, dagrun_id=scheduled__2018-08-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:14.435479+00:00, try_number=1, job_id=1154, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-28 00:00:00+00:00 +INFO - Started process 622 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Extract_B2', 'scheduled__2018-08-28T00:00:00+00:00', '--job-id', '1154', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp0z8s_9ti'] +INFO - Job 1154: Subtask Extract_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Extract_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=ETL_dag, task_id=Extract_B2, execution_date=20180828T000000, start_date=20221112T234514, end_date=20221112T234518 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Extract_B2 airflow_run_id=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Extract_B2: TaskMetadata(name='ETL_dag.Extract_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Extract_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Extract_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': 
False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'Transform_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:45:18.790184Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Extract_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Extract_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Extract_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "37022b0f-3e57-4d27-b5a2-d9c903c349aa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" new file mode 100644 index 00000000..6ed57fa6 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B1/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:45:41.078311Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B1'}", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b9c1d5a5-fed8-40e5-bee3-8449af5a3cac"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B1, dagrun_id=scheduled__2018-08-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:41.078311+00:00, try_number=1, job_id=1159, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-28 00:00:00+00:00 +INFO - Started process 652 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B1', 'scheduled__2018-08-28T00:00:00+00:00', '--job-id', '1159', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp_x5oi4lz'] +INFO - Job 1159: Subtask Load_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770d2f70> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B1, execution_date=20180828T000000, start_date=20221112T234541, end_date=20221112T234542 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1159 for task Load_B1 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 652) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" new file mode 100644 index 00000000..035f2662 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Load_B2/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:45:32.076726Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Load_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Load_B2"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Transform_B2'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Load_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Load_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "573a5e2b-83d7-4d60-8fba-18ffe8df0ee0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Load_B2, dagrun_id=scheduled__2018-08-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:32.076726+00:00, try_number=1, job_id=1158, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-28 00:00:00+00:00 +INFO - Started process 645 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Load_B2', 'scheduled__2018-08-28T00:00:00+00:00', '--job-id', '1158', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp9hj47dw7'] +INFO - Job 1158: Subtask Load_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, 
but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Load_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search 
to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During 
handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 
205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ed0d0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=ETL_dag, task_id=Load_B2, execution_date=20180828T000000, start_date=20221112T234532, end_date=20221112T234533 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1158 for task Load_B2 (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 645) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" 
"b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" new file mode 100644 index 00000000..9a4c5939 --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B1/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:45:22.284914Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B1"}, 
"_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B1'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B1'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "551d4281-1eb1-4b1a-8605-10a8daf5020c"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B1, dagrun_id=scheduled__2018-08-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:22.284914+00:00, try_number=1, job_id=1156, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-28 00:00:00+00:00 +INFO - Started process 634 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B1', 'scheduled__2018-08-28T00:00:00+00:00', '--job-id', '1156', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7tfy33t8'] +INFO - Job 1156: Subtask Transform_B1 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the 
old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B1 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B1, execution_date=20180828T000000, start_date=20221112T234522, end_date=20221112T234537 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B1 airflow_run_id=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B1: TaskMetadata(name='ETL_dag.Transform_B1', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B1', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'Transform_B1', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B1'}, 'downstream_task_ids': {'Load_B1'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:45:37.873047Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B1", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": 
"<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B1"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B1", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "551d4281-1eb1-4b1a-8605-10a8daf5020c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" new file mode 100644 index 00000000..5ecba84b --- /dev/null +++ "b/dags/logs/dag_id=ETL_dag/run_id=scheduled__2018-08-28T00\357\200\27200\357\200\27200+00\357\200\27200/task_id=Transform_B2/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 2 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:45:22.322153Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "owner": "BROC95", "python_callable": "", "retries": 1, "retry_delay": "0:05:00", "start_date": "2018-03-01T00:00:00+00:00", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "ETL_dag", "schedule_interval": "@daily"}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'Load_B2'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 1, "retry_delay": "0:05:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2018-03-01T00:00:00+00:00", "task_group": "", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": "{'Extract_B2'}", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2018-08-28T00:00:00.000000Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "ETL_dag", "namespace": "default"}, "run": {"runId": "81755ac3-ac96-3f27-9103-8eecbafac0fc"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d34445f-0b23-4e82-b197-22d9011883f0"}} +INFO - TaskInstance Details: dag_id=ETL_dag, task_id=Transform_B2, dagrun_id=scheduled__2018-08-28T00:00:00+00:00, map_index=-1, run_start_date=2022-11-12 23:45:22.322153+00:00, try_number=1, job_id=1157, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2018-08-28 00:00:00+00:00 +INFO - Started process 635 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'ETL_dag', 'Transform_B2', 'scheduled__2018-08-28T00:00:00+00:00', '--job-id', '1157', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp4axrtevv'] +INFO - Job 1157: Subtask Transform_B2 +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=BROC95 +AIRFLOW_CTX_DAG_ID=ETL_dag +AIRFLOW_CTX_TASK_ID=Transform_B2 +AIRFLOW_CTX_EXECUTION_DATE=2018-08-28T00:00:00+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-12' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=ETL_dag, task_id=Transform_B2, execution_date=20180828T000000, start_date=20221112T234522, end_date=20221112T234526 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=ETL_dag task_id=Transform_B2 airflow_run_id=scheduled__2018-08-28T00:00:00+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation Transform_B2: TaskMetadata(name='ETL_dag.Transform_B2', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'Transform_B2', 'dag': , 'owner': 'BROC95', 'retries': 1, 'retry_delay': datetime.timedelta(seconds=300), 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'python_callable': }, 
'_BaseOperator__from_mapped': False, 'task_id': 'Transform_B2', 'task_group': , 'owner': 'BROC95', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'start_date': DateTime(2018, 3, 1, 0, 0, 0, tzinfo=Timezone('UTC')), 'executor_config': {}, 'run_as_user': None, 'retries': 1, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=300), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'Extract_B2'}, 'downstream_task_ids': {'Load_B2'}, 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:45:26.350773Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "ETL_dag.Transform_B2", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", 
"unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"dag": "<>", "owner": "BROC95", "python_callable": "<>", "retries": 1, "retry_delay": "<>", "start_date": "<>", "task_id": "Transform_B2"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "BROC95", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 1, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "Transform_B2", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5d34445f-0b23-4e82-b197-22d9011883f0"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..54365855 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - 
+-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:11:15.582050Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, 
"start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:01:02.522937Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "9fe2da41-4121-3635-9034-751785358306"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "9fe2da41-4121-3635-9034-751785358306"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, 
"outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "187877d9-314c-4221-943d-8e65aa2d2926"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:01:02.522937+00:00, map_index=-1, run_start_date=2022-11-09 19:11:15.582050+00:00, try_number=2, job_id=549, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:01:02.522937+00:00 +INFO - Started process 810 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:01:02.522937+00:00', '--job-id', '549', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp9x5eczb4'] +INFO - Job 549: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:01:02.522937+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:01:02.522937+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-09' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-09' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221109T190102, start_date=20221109T191115, end_date=20221109T191118 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:01:02.522937+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': 
None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:11:18.859686Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "187877d9-314c-4221-943d-8e65aa2d2926"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..fc92b119 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:11:26.130922Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:01:02.522937Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "9fe2da41-4121-3635-9034-751785358306"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "9fe2da41-4121-3635-9034-751785358306"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cc9051fb-bfab-4446-a899-b97b644ded88"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:01:02.522937+00:00, map_index=-1, run_start_date=2022-11-09 19:11:26.130922+00:00, try_number=1, job_id=552, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:01:02.522937+00:00 +INFO - Started process 873 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:01:02.522937+00:00', '--job-id', '552', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpue_y05s3'] +INFO - Job 552: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:01:02.522937+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:01:02.522937+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e6061f0> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'n7WYVuCprOw4VvaiWp/ywA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNComahue_process.txt + +content-md5:n7WYVuCprOw4VvaiWp/ywA== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191127Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191127Z +20221109/us-east-1/s3/aws4_request +2cd62667efe4f233bba62187fe23d9d2457417870f8f12d92f8b3ae45e07b623 +INFO - '2022-11-09' - botocore.auth - Signature: +b60376642ba7669dad511fbeaee292b87b9d895fdc16f15e4df4e7b320bff7f0 +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': '70aW8lrlUZ3On+baTJR0Vi6sIWcYtShd7f0pQcfp+sDIEzXlCCDaIYTCpV59ZPTVhTeZRHC43Pg=', 'x-amz-request-id': 'F84QM9CK62SDDS38', 'Date': 'Wed, 09 Nov 2022 19:11:26 GMT', 'ETag': '"9fb59856e0a9acec3856f6a25a9ff2c0"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221109T190102, start_date=20221109T191126, end_date=20221109T191128 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:01:02.522937+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:11:28.327885Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cc9051fb-bfab-4446-a899-b97b644ded88"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..7400e24e --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27201\357\200\27202.522937+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:11:20.109128Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:01:02.522937Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "9fe2da41-4121-3635-9034-751785358306"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "9fe2da41-4121-3635-9034-751785358306"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25af37d0-855d-4d06-ba9b-2b6ebbe24eb8"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:01:02.522937+00:00, map_index=-1, run_start_date=2022-11-09 19:11:20.109128+00:00, try_number=1, job_id=551, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:01:02.522937+00:00 +INFO - Started process 824 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:01:02.522937+00:00', '--job-id', '551', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpu01hhuzx'] +INFO - Job 551: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:01:02.522937+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:01:02.522937+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221109T190102, start_date=20221109T191120, end_date=20221109T191125 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:01:02.522937+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:11:25.349554Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "25af37d0-855d-4d06-ba9b-2b6ebbe24eb8"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..ea5b728e --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:10:01.742252Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:10:00.504114Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "b38d3e79-bbd7-3630-a1ed-e2331d809d3a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "b38d3e79-bbd7-3630-a1ed-e2331d809d3a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bddbc244-d0d1-45e8-a21a-cfae9cc6b8e4"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:10:00.504114+00:00, map_index=-1, run_start_date=2022-11-09 19:10:01.742252+00:00, try_number=1, job_id=543, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:10:00.504114+00:00 +INFO - Started process 671 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:10:00.504114+00:00', '--job-id', '543', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp5gqh08ak'] +INFO - Job 543: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:10:00.504114+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:10:00.504114+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-09' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-09' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221109T191000, start_date=20221109T191001, end_date=20221109T191005 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:10:00.504114+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:10:05.747307Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bddbc244-d0d1-45e8-a21a-cfae9cc6b8e4"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..768aaa61 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:10:13.094086Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:10:00.504114Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "b38d3e79-bbd7-3630-a1ed-e2331d809d3a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "b38d3e79-bbd7-3630-a1ed-e2331d809d3a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "026314d4-103f-4d37-9ede-6e98ca38c76c"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:10:00.504114+00:00, map_index=-1, run_start_date=2022-11-09 19:10:13.094086+00:00, try_number=1, job_id=546, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:10:00.504114+00:00 +INFO - Started process 694 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:10:00.504114+00:00', '--job-id', '546', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpehbd67zx'] +INFO - Job 546: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:10:00.504114+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:10:00.504114+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e61fe50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'JapneMNQm8Feta9PPETrqQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNComahue_process.txt + +content-md5:JapneMNQm8Feta9PPETrqQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191013Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191013Z +20221109/us-east-1/s3/aws4_request +3ec529e6ee1ce38dbd7988b6f8651b4b9c34b6416a00f7072758aca5bfe885de +INFO - '2022-11-09' - botocore.auth - Signature: +a3259b2c6d9cd3ea80f9e955dccb662c649cec717fb3a35e86484298bcdf1042 +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'OYDfA1CPOW+ppRNgCoslOKsimEpJm4HipIf/4Dyont2oCjlBVyTWekrCczGSDBDL1GMxC72fwXQ=', 'x-amz-request-id': 'CVAPNNCWYGDSRZ7N', 'Date': 'Wed, 09 Nov 2022 19:10:12 GMT', 'ETag': '"25aa6778c3509bc15eb5af4f3c44eba9"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221109T191000, start_date=20221109T191013, end_date=20221109T191015 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:10:00.504114+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:10:15.135178Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "026314d4-103f-4d37-9ede-6e98ca38c76c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..6395c10b --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27210\357\200\27200.504114+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:10:06.979908Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:10:00.504114Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "b38d3e79-bbd7-3630-a1ed-e2331d809d3a"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "b38d3e79-bbd7-3630-a1ed-e2331d809d3a"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "16bc74dd-ae33-4190-ba64-fa74c2c39407"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:10:00.504114+00:00, map_index=-1, run_start_date=2022-11-09 19:10:06.979908+00:00, try_number=1, job_id=544, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:10:00.504114+00:00 +INFO - Started process 682 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:10:00.504114+00:00', '--job-id', '544', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpdbiw4ri9'] +INFO - Job 544: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:10:00.504114+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:10:00.504114+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221109T191000, start_date=20221109T191006, end_date=20221109T191011 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:10:00.504114+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:10:11.625564Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "16bc74dd-ae33-4190-ba64-fa74c2c39407"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..49337338 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:11:58.263163Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:11:57.287173Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ad315108-7d36-3327-83eb-41ea0de7743e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ad315108-7d36-3327-83eb-41ea0de7743e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d6131c9-81da-4a94-9a50-04fbf32f21d3"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:11:57.287173+00:00, map_index=-1, run_start_date=2022-11-09 19:11:58.263163+00:00, try_number=1, job_id=553, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:11:57.287173+00:00 +INFO - Started process 930 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:11:57.287173+00:00', '--job-id', '553', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpi8ivcaf3'] +INFO - Job 553: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:11:57.287173+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:11:57.287173+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-09' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-09' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221109T191157, start_date=20221109T191158, end_date=20221109T191201 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:11:57.287173+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:01.920334Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d6131c9-81da-4a94-9a50-04fbf32f21d3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..8209bc4e --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:12:09.677249Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:11:57.287173Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ad315108-7d36-3327-83eb-41ea0de7743e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ad315108-7d36-3327-83eb-41ea0de7743e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b007d15d-3abc-427f-8415-c8de6971a851"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:11:57.287173+00:00, map_index=-1, run_start_date=2022-11-09 19:12:09.677249+00:00, try_number=1, job_id=557, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:11:57.287173+00:00 +INFO - Started process 956 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:11:57.287173+00:00', '--job-id', '557', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpq200wamn'] +INFO - Job 557: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:11:57.287173+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:11:57.287173+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e61fe50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '4N/KLWchwT4Oj3PQFUt+sQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNComahue_process.txt + +content-md5:4N/KLWchwT4Oj3PQFUt+sQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191210Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191210Z +20221109/us-east-1/s3/aws4_request +703e7b7525458129bc83de0d4c5b1230e0a9ec2ea08196b2f8f53ca212aa33e0 +INFO - '2022-11-09' - botocore.auth - Signature: +880f1e10b27633cdafce0ac8811f4b7393eec30ab71a06a6cef3e8ad099241ab +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'HYLBF8Jl8hZfRAfK2hZibCSlnTwSBwvvODoTWIidhdOVtnD8j7rYRkg17xQqtwteQsl/P3cl3wY=', 'x-amz-request-id': 'TYRJHBBH5H2J397Y', 'Date': 'Wed, 09 Nov 2022 19:12:09 GMT', 'ETag': '"e0dfca2d6721c13e0e8f73d0154b7eb1"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221109T191157, start_date=20221109T191209, end_date=20221109T191211 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:11:57.287173+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:11.653186Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b007d15d-3abc-427f-8415-c8de6971a851"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..6d6c44cc --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27211\357\200\27257.287173+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:12:03.504763Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:11:57.287173Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ad315108-7d36-3327-83eb-41ea0de7743e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ad315108-7d36-3327-83eb-41ea0de7743e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2f11f7a0-f992-4665-bad5-cee953147630"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:11:57.287173+00:00, map_index=-1, run_start_date=2022-11-09 19:12:03.504763+00:00, try_number=1, job_id=555, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:11:57.287173+00:00 +INFO - Started process 939 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:11:57.287173+00:00', '--job-id', '555', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpeyo8l1ay'] +INFO - Job 555: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:11:57.287173+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:11:57.287173+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221109T191157, start_date=20221109T191203, end_date=20221109T191208 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:11:57.287173+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:08.137628Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2f11f7a0-f992-4665-bad5-cee953147630"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..e9e5d9bf --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:12:08.588056Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:12:06.835125Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "818350ee-37cf-33e6-87e5-e0288d67f962"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "818350ee-37cf-33e6-87e5-e0288d67f962"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f31130a-4bf1-4a8b-8976-29667b4753ca"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:12:06.835125+00:00, map_index=-1, run_start_date=2022-11-09 19:12:08.588056+00:00, try_number=1, job_id=556, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:12:06.835125+00:00 +INFO - Started process 952 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:12:06.835125+00:00', '--job-id', '556', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpmmzfr9bu'] +INFO - Job 556: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:12:06.835125+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:12:06.835125+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-09' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-09' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221109T191206, start_date=20221109T191208, end_date=20221109T191211 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:12:06.835125+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:11.914138Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6f31130a-4bf1-4a8b-8976-29667b4753ca"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..398323cc --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:12:18.670777Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:12:06.835125Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "818350ee-37cf-33e6-87e5-e0288d67f962"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "818350ee-37cf-33e6-87e5-e0288d67f962"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "04862a89-d574-446f-bb65-86ac0d33c70a"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:12:06.835125+00:00, map_index=-1, run_start_date=2022-11-09 19:12:18.670777+00:00, try_number=1, job_id=559, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:12:06.835125+00:00 +INFO - Started process 974 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:12:06.835125+00:00', '--job-id', '559', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmptslj7mm_'] +INFO - Job 559: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:12:06.835125+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:12:06.835125+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e620e50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'RJFnRXIUPUhhLRCsMhht+A==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNComahue_process.txt + +content-md5:RJFnRXIUPUhhLRCsMhht+A== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191219Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191219Z +20221109/us-east-1/s3/aws4_request +da2c231f44b43d7ff11fc16a45643647bb51ee2b584b3a7fd995f1ed35227a7c +INFO - '2022-11-09' - botocore.auth - Signature: +2120355406019266a5074fcdc863a7ab8aae1208c90714bccdaeaaa2afe6b2f3 +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'oOgC6XNrosrITm9mT56dCgnN50py4gXRc8Zzr+XExLfDWrMtRa+eQhy2X0LOALWRzx4hyjmnOPUbi6KxXQbBqQ==', 'x-amz-request-id': '7854Z2GGJGH7Y437', 'Date': 'Wed, 09 Nov 2022 19:12:18 GMT', 'ETag': '"4491674572143d48612d10ac32186df8"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221109T191206, start_date=20221109T191218, end_date=20221109T191221 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:12:06.835125+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:21.081828Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "04862a89-d574-446f-bb65-86ac0d33c70a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..79015ba5 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27206.835125+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:12:13.298953Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:12:06.835125Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "818350ee-37cf-33e6-87e5-e0288d67f962"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "818350ee-37cf-33e6-87e5-e0288d67f962"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5db52dba-fe46-4db9-a292-72f9cb00d86b"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:12:06.835125+00:00, map_index=-1, run_start_date=2022-11-09 19:12:13.298953+00:00, try_number=1, job_id=558, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:12:06.835125+00:00 +INFO - Started process 964 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:12:06.835125+00:00', '--job-id', '558', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp1ze9z16c'] +INFO - Job 558: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:12:06.835125+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:12:06.835125+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221109T191206, start_date=20221109T191213, end_date=20221109T191218 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:12:06.835125+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:18.085421Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5db52dba-fe46-4db9-a292-72f9cb00d86b"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..808c7e5e --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:21:32.870723Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:21:31.545458Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "02bbbaa2-3cf0-3eb7-8f1c-d94eeb61a095"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "02bbbaa2-3cf0-3eb7-8f1c-d94eeb61a095"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f1f77bf7-d139-4340-9e11-448207bc2532"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:21:31.545458+00:00, map_index=-1, run_start_date=2022-11-09 19:21:32.870723+00:00, try_number=1, job_id=563, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:21:31.545458+00:00 +INFO - Started process 1936 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:21:31.545458+00:00', '--job-id', '563', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpq4h3l7e4'] +INFO - Job 563: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:21:31.545458+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:21:31.545458+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-09' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-09' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221109T192131, start_date=20221109T192132, end_date=20221109T192136 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:21:31.545458+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:21:36.547278Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f1f77bf7-d139-4340-9e11-448207bc2532"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..7b73e2ca --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:21:41.452588Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:21:31.545458Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "02bbbaa2-3cf0-3eb7-8f1c-d94eeb61a095"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "02bbbaa2-3cf0-3eb7-8f1c-d94eeb61a095"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "12b66282-7b87-4fbe-9c36-5798b3cf5002"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:21:31.545458+00:00, map_index=-1, run_start_date=2022-11-09 19:21:41.452588+00:00, try_number=1, job_id=565, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:21:31.545458+00:00 +INFO - Started process 1958 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:21:31.545458+00:00', '--job-id', '565', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp43fwy9l0'] +INFO - Job 565: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:21:31.545458+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:21:31.545458+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e61ee50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MDaSkrWwZoE7zgrvs8F/rw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNComahue_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNComahue_process.txt + +content-md5:MDaSkrWwZoE7zgrvs8F/rw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T192142Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T192142Z +20221109/us-east-1/s3/aws4_request +f96abc69c8058e88a72b02dffdd2d1e81c3a42c70a6beecd56fa13d7e070b00e +INFO - '2022-11-09' - botocore.auth - Signature: +c2e4f19dea60a60e0ed604e2b8a82dff733fa8e07336a7c1b18d3057fa567a2a +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'LhS6ye0JYXReFv9wbWcysZ9ZRUarzGDkZDXYNioX2/ZX70FDyIiYgWapwtYqMahZyuhm6gyMvKU=', 'x-amz-request-id': '9M48JM2PYXA2JH8V', 'Date': 'Wed, 09 Nov 2022 19:21:41 GMT', 'ETag': '"30369292b5b066813bce0aefb3c17faf"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221109T192131, start_date=20221109T192141, end_date=20221109T192143 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:21:31.545458+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:21:43.688317Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "12b66282-7b87-4fbe-9c36-5798b3cf5002"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..76dc53ea --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27231.545458+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:21:37.426050Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:21:31.545458Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "02bbbaa2-3cf0-3eb7-8f1c-d94eeb61a095"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "02bbbaa2-3cf0-3eb7-8f1c-d94eeb61a095"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6ae3d0de-4a74-45c3-a578-5efd24ffdb11"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:21:31.545458+00:00, map_index=-1, run_start_date=2022-11-09 19:21:37.426050+00:00, try_number=1, job_id=564, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:21:31.545458+00:00 +INFO - Started process 1953 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:21:31.545458+00:00', '--job-id', '564', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp5c46lpjr'] +INFO - Job 564: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:21:31.545458+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:21:31.545458+00:00 +INFO - '2022-11-09' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221109T192131, start_date=20221109T192137, end_date=20221109T192140 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:21:31.545458+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:21:40.339524Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "6ae3d0de-4a74-45c3-a578-5efd24ffdb11"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..b57a3c3d --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,51 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:11:38.579160Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": 
"2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:37.114429Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, 
"executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0b9576e6-0767-4185-9201-1587d6f387cd"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:11:37.114429+00:00, map_index=-1, run_start_date=2022-11-10 06:11:38.579160+00:00, try_number=1, job_id=579, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:37.114429+00:00 +INFO - Started process 1417 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:11:37.114429+00:00', '--job-id', '579', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp6zycxfvc'] +INFO - Job 579: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:37.114429+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:11:37.114429+00:00 +INFO - Done. Returned value was: {{ task_instance.xcom_pull(task_ids='extract', dag_id='adhoc_airflow', key='return_value') }} +ERROR - Could not serialize the XCom value into JSON. If you are using pickle instead of JSON for XCom, then you need to enable pickle support for XCom in your airflow config. +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/taskinstance.py", line 2378, in xcom_push + XCom.set( + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 206, in set + value = cls.serialize_value( + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 597, in serialize_value + return json.dumps(value).encode('UTF-8') + File "/usr/local/lib/python3.9/json/__init__.py", line 231, in dumps + return _default_encoder.encode(obj) + File "/usr/local/lib/python3.9/json/encoder.py", line 199, in encode + chunks = self.iterencode(o, _one_shot=True) + File "/usr/local/lib/python3.9/json/encoder.py", line 257, in iterencode + return _iterencode(o, 0) + File "/usr/local/lib/python3.9/json/encoder.py", line 179, in default + raise TypeError(f'Object of type {o.__class__.__name__} ' +TypeError: Object of type PlainXComArg is not JSON serializable +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T061137, start_date=20221110T061138, end_date=20221110T061139 +ERROR - Failed to execute job 579 for task TaskExtract (Object of type PlainXComArg is not JSON serializable; 1417) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..e3423f6d --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:21:39.909286Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:37.114429Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e3aac47e-84be-4c3f-a632-aba729ed6641"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:11:37.114429+00:00, map_index=-1, run_start_date=2022-11-10 06:21:39.909286+00:00, try_number=2, job_id=590, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:37.114429+00:00 +INFO - Started process 2453 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:11:37.114429+00:00', '--job-id', '590', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp_byyp3rd'] +INFO - Job 590: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:37.114429+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:11:37.114429+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T061137, start_date=20221110T062139, end_date=20221110T062143 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:11:37.114429+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:43.186882Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e3aac47e-84be-4c3f-a632-aba729ed6641"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..277affe8 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:21:47.829558Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:37.114429Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "31f98ce4-fe02-46b3-b4f3-7a3f429b007c"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:11:37.114429+00:00, map_index=-1, run_start_date=2022-11-10 06:21:47.829558+00:00, try_number=1, job_id=594, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:37.114429+00:00 +INFO - Started process 2472 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:11:37.114429+00:00', '--job-id', '594', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpzom_utrr'] +INFO - Job 594: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:37.114429+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:11:37.114429+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc542848b0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'r53hmRPSCIRyITb6RL7Qdw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:r53hmRPSCIRyITb6RL7Qdw== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T062148Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T062148Z +20221110/us-east-1/s3/aws4_request +b682353e2184570d1d35a8b9c1851258065bbd7e5662be7fbcffd4dccb6f62f5 +INFO - '2022-11-10' - botocore.auth - Signature: +d220e52be653b15046c7ca42a31315776563835a6982f8d3ad9856c01448fe4c +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'vqu2LT5HpDXHifYnbpk0slwm+IzDzwmHh32vcdgJFEpJTEGjyINWI3YRGHH6owSYzvovD7ub+WA=', 'x-amz-request-id': '42BGJKA3BXT77D8P', 'Date': 'Thu, 10 Nov 2022 06:21:49 GMT', 'ETag': '"af9de19913d20884722136fa44bed077"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T061137, start_date=20221110T062147, end_date=20221110T062150 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:11:37.114429+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:50.145926Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "31f98ce4-fe02-46b3-b4f3-7a3f429b007c"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..4071abff --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27211\357\200\27237.114429+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:21:43.924751Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:37.114429Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "ff6a1ccb-f259-3032-b9c1-ffad4697cf0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d2e9e141-d8e0-4c10-9880-02e63ca4eda1"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:11:37.114429+00:00, map_index=-1, run_start_date=2022-11-10 06:21:43.924751+00:00, try_number=1, job_id=591, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:37.114429+00:00 +INFO - Started process 2462 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:11:37.114429+00:00', '--job-id', '591', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpqffq3rpt'] +INFO - Job 591: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:37.114429+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:11:37.114429+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T061137, start_date=20221110T062143, end_date=20221110T062147 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:11:37.114429+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:47.126660Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d2e9e141-d8e0-4c10-9880-02e63ca4eda1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..da18ea66 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:16:02.787543Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:16:01.763303Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "d2e6f074-7327-3335-b623-8a77bdced34c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "d2e6f074-7327-3335-b623-8a77bdced34c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "323f665d-701e-48cb-b5c6-9579a877aaf3"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:16:01.763303+00:00, map_index=-1, run_start_date=2022-11-10 06:16:02.787543+00:00, try_number=1, job_id=583, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:16:01.763303+00:00 +INFO - Started process 1890 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:16:01.763303+00:00', '--job-id', '583', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpj39bc6mt'] +INFO - Job 583: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:16:01.763303+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:16:01.763303+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T061601, start_date=20221110T061602, end_date=20221110T061606 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:16:01.763303+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:16:06.076474Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "323f665d-701e-48cb-b5c6-9579a877aaf3"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..bee76477 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:16:11.511474Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:16:01.763303Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "d2e6f074-7327-3335-b623-8a77bdced34c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "d2e6f074-7327-3335-b623-8a77bdced34c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d1bbf407-f00c-4b77-9b1a-9db8e23dea75"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:16:01.763303+00:00, map_index=-1, run_start_date=2022-11-10 06:16:11.511474+00:00, try_number=1, job_id=585, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:16:01.763303+00:00 +INFO - Started process 1903 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:16:01.763303+00:00', '--job-id', '585', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpihb_e7mn'] +INFO - Job 585: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:16:01.763303+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:16:01.763303+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc54296ca0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'Ns/IH5x79yHNcYRwN19JbQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:Ns/IH5x79yHNcYRwN19JbQ== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T061612Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T061612Z +20221110/us-east-1/s3/aws4_request +c7c6d77cbbe02d7119710b91d7d0c363a0fbfee6c96bae5c09baef667367bdfd +INFO - '2022-11-10' - botocore.auth - Signature: +f03c9d0ae3ca125fe212aa916b86f4b77044af8d8fac689c3741877c7b59ddd3 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'dz6qqIR+4ZNRYmc+HzWZkKUi+A/zrckTlObTvOfKjzvNgIfAVJiMbLqtIDeokByvUO27waTQCFs=', 'x-amz-request-id': 'F13YD4FX1T4KYSSB', 'Date': 'Thu, 10 Nov 2022 06:16:12 GMT', 'ETag': '"36cfc81f9c7bf721cd718470375f496d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T061601, start_date=20221110T061611, end_date=20221110T061613 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:16:01.763303+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:16:13.907943Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d1bbf407-f00c-4b77-9b1a-9db8e23dea75"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..05e97c1d --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27216\357\200\27201.763303+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:16:06.939266Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:16:01.763303Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "d2e6f074-7327-3335-b623-8a77bdced34c"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "d2e6f074-7327-3335-b623-8a77bdced34c"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "67fdf32a-8ca3-411b-8646-1b9d2a1cb860"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:16:01.763303+00:00, map_index=-1, run_start_date=2022-11-10 06:16:06.939266+00:00, try_number=1, job_id=584, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:16:01.763303+00:00 +INFO - Started process 1895 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:16:01.763303+00:00', '--job-id', '584', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp49nus2ep'] +INFO - Job 584: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:16:01.763303+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:16:01.763303+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T061601, start_date=20221110T061606, end_date=20221110T061609 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:16:01.763303+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:16:09.950259Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "67fdf32a-8ca3-411b-8646-1b9d2a1cb860"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..fb69a4bd --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:21:54.640155Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:21:53.307572Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "704802ad-be42-3fb5-8832-846703f01609"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "704802ad-be42-3fb5-8832-846703f01609"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8371ca45-7a53-407a-8d51-6130777ff83c"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:21:53.307572+00:00, map_index=-1, run_start_date=2022-11-10 06:21:54.640155+00:00, try_number=1, job_id=595, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:21:53.307572+00:00 +INFO - Started process 2483 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:21:53.307572+00:00', '--job-id', '595', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpb1yozjci'] +INFO - Job 595: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:21:53.307572+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:21:53.307572+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T062153, start_date=20221110T062154, end_date=20221110T062157 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:21:53.307572+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:57.814158Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8371ca45-7a53-407a-8d51-6130777ff83c"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..8303dee4 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:22:02.793744Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:21:53.307572Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "704802ad-be42-3fb5-8832-846703f01609"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "704802ad-be42-3fb5-8832-846703f01609"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8420463e-e94e-4ff2-a388-4c5d88b9d2bb"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:21:53.307572+00:00, map_index=-1, run_start_date=2022-11-10 06:22:02.793744+00:00, try_number=1, job_id=597, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:21:53.307572+00:00 +INFO - Started process 2529 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:21:53.307572+00:00', '--job-id', '597', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpkqd5sreb'] +INFO - Job 597: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:21:53.307572+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:21:53.307572+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc54276700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'AgiCtq9PYLojIug2h+nTUw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:AgiCtq9PYLojIug2h+nTUw== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T062203Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T062203Z +20221110/us-east-1/s3/aws4_request +af584dda8c6d766c98918727ba08381f193279f7655adb76bce1ee825f710f00 +INFO - '2022-11-10' - botocore.auth - Signature: +acf599066cadfc1f48abb235728902456430f2d2ef2bcefa222ee3f4c1dd8678 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'GONB9taa3zZm7WcYbJpkDM1HcVLpp2EAa4PAZfJ4KTh+Aq0eyYYFjdqCv+4l6C4CRiCfSMeZhTVzWjjCASsnvw==', 'x-amz-request-id': 'NNKDNBRFC98THR41', 'Date': 'Thu, 10 Nov 2022 06:22:04 GMT', 'ETag': '"020882b6af4f60ba2322e83687e9d353"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T062153, start_date=20221110T062202, end_date=20221110T062205 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:21:53.307572+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:22:05.134988Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8420463e-e94e-4ff2-a388-4c5d88b9d2bb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..5df26c1c --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27221\357\200\27253.307572+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:21:59.291923Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:21:53.307572Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "704802ad-be42-3fb5-8832-846703f01609"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "704802ad-be42-3fb5-8832-846703f01609"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51f426cd-6e06-4804-8706-62a058ee1cdf"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:21:53.307572+00:00, map_index=-1, run_start_date=2022-11-10 06:21:59.291923+00:00, try_number=1, job_id=596, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:21:53.307572+00:00 +INFO - Started process 2503 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:21:53.307572+00:00', '--job-id', '596', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp0nkv30j3'] +INFO - Job 596: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:21:53.307572+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:21:53.307572+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T062153, start_date=20221110T062159, end_date=20221110T062202 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:21:53.307572+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:22:02.031573Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "51f426cd-6e06-4804-8706-62a058ee1cdf"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..f3426c3c --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:35:29.099998Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:35:28.220443Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "1a902fcf-d201-3e4e-91a4-dbd89d2f129e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "1a902fcf-d201-3e4e-91a4-dbd89d2f129e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "67f1af49-edf1-48dd-a7f5-d6084ecce5ee"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:35:28.220443+00:00, map_index=-1, run_start_date=2022-11-10 06:35:29.099998+00:00, try_number=1, job_id=604, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:35:28.220443+00:00 +INFO - Started process 3884 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:35:28.220443+00:00', '--job-id', '604', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmps96p1xrw'] +INFO - Job 604: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:35:28.220443+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:35:28.220443+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T063528, start_date=20221110T063529, end_date=20221110T063532 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:35:28.220443+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:35:32.546218Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "67f1af49-edf1-48dd-a7f5-d6084ecce5ee"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..5f0eff4f --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,224 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:35:37.218613Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:35:28.220443Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "1a902fcf-d201-3e4e-91a4-dbd89d2f129e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "1a902fcf-d201-3e4e-91a4-dbd89d2f129e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5a9171d-0748-4488-838a-77d29ba0176a"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:35:28.220443+00:00, map_index=-1, run_start_date=2022-11-10 06:35:37.218613+00:00, try_number=1, job_id=606, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:35:28.220443+00:00 +INFO - Started process 3894 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:35:28.220443+00:00', '--job-id', '606', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpdaimsnu8'] +INFO - Job 606: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:35:28.220443+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:35:28.220443+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc54277700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'v2jS2Q5VK0YrzUTKEpxbuQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:v2jS2Q5VK0YrzUTKEpxbuQ== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T063537Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T063537Z +20221110/us-east-1/s3/aws4_request +0ab005ee5ca989038fd36a8b34dbce48999aec071618ac6322ccd668a2e3b74b +INFO - '2022-11-10' - botocore.auth - Signature: +48839e60da0210a126aba5290b03f14f973734a8d51c7be0bfd839af98af0968 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - retry needed, retryable exception caught: Connection was closed before we received a valid response from endpoint URL: "https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt". 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 449, in _make_request + six.raise_from(e, None) + File "", line 3, in raise_from + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 444, in _make_request + httplib_response = conn.getresponse() + File "/usr/local/lib/python3.9/http/client.py", line 1377, in getresponse + response.begin() + File "/usr/local/lib/python3.9/http/client.py", line 320, in begin + version, status, reason = self._read_status() + File "/usr/local/lib/python3.9/http/client.py", line 289, in _read_status + raise RemoteDisconnected("Remote end closed connection without" +http.client.RemoteDisconnected: Remote end closed connection without response + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 769, in reraise + raise value.with_traceback(tb) + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 449, in _make_request + six.raise_from(e, None) + File "", line 3, in raise_from + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 444, in _make_request + httplib_response = conn.getresponse() + File 
"/usr/local/lib/python3.9/http/client.py", line 1377, in getresponse + response.begin() + File "/usr/local/lib/python3.9/http/client.py", line 320, in begin + version, status, reason = self._read_status() + File "/usr/local/lib/python3.9/http/client.py", line 289, in _read_status + raise RemoteDisconnected("Remote end closed connection without" +urllib3.exceptions.ProtocolError: ('Connection aborted.', RemoteDisconnected('Remote end closed connection without response')) + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/retryhandler.py", line 307, in _should_retry + return self._checker( + File "/usr/local/lib/python3.9/site-packages/botocore/retryhandler.py", line 363, in __call__ + checker_response = checker( + File "/usr/local/lib/python3.9/site-packages/botocore/retryhandler.py", line 247, in __call__ + return self._check_caught_exception( + File "/usr/local/lib/python3.9/site-packages/botocore/retryhandler.py", line 416, in _check_caught_exception + raise caught_exception + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 281, in _do_get_response + http_response = self._send(request) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 377, in _send + return self.http_session.send(request) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 487, in send + raise ConnectionClosedError( +botocore.exceptions.ConnectionClosedError: Connection was closed before we received a valid response from endpoint URL: "https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt". 
+INFO - '2022-11-10' - botocore.retryhandler - Retry needed, action of: 0.7949755117285345 +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.endpoint - Response received to retry, sleeping for 0.7949755117285345 seconds +INFO - '2022-11-10' - botocore.awsrequest - Rewinding stream: +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:v2jS2Q5VK0YrzUTKEpxbuQ== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T063551Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T063551Z +20221110/us-east-1/s3/aws4_request +571ac79bf66f79acc3c9a24c9826ab68058a550c8e33a01a1bac29048b079290 +INFO - '2022-11-10' - botocore.auth - Signature: +862602bcefa1372d24cb1e118aee209e575a3a8068764182aa0ac22822e2c07a +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (2): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'tsAc7s/PR+vKeM/U2d3T4CgqxVw0JFa5+HYOvgMwkzJU6jVeWe9eGrVceZsWcGD5SmEZfeDeWN4=', 'x-amz-request-id': 'GR7VK7X7C0JEXQ09', 'Date': 'Thu, 10 Nov 2022 06:35:59 GMT', 'ETag': '"bf68d2d90e552b462bcd44ca129c5bb9"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T063528, start_date=20221110T063537, end_date=20221110T063600 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:35:28.220443+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:36:00.223491Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e5a9171d-0748-4488-838a-77d29ba0176a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..65b81aa4 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-10T06\357\200\27235\357\200\27228.220443+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:35:33.875576Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:35:28.220443Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "1a902fcf-d201-3e4e-91a4-dbd89d2f129e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "1a902fcf-d201-3e4e-91a4-dbd89d2f129e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "97ca5e7e-3bf0-45c0-9774-f5833f71adba"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:35:28.220443+00:00, map_index=-1, run_start_date=2022-11-10 06:35:33.875576+00:00, try_number=1, job_id=605, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:35:28.220443+00:00 +INFO - Started process 3889 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:35:28.220443+00:00', '--job-id', '605', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpmgboyn0l'] +INFO - Job 605: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:35:28.220443+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:35:28.220443+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T063528, start_date=20221110T063533, end_date=20221110T063536 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:35:28.220443+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:35:36.329256Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "97ca5e7e-3bf0-45c0-9774-f5833f71adba"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..3294a55a --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:18:29.157277Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T23:18:25.241753Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a19df9fd-b962-4b31-8f1b-9610f1b85398"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-12T23:18:25.241753+00:00, map_index=-1, run_start_date=2022-11-12 23:18:29.157277+00:00, try_number=1, job_id=1111, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 23:18:25.241753+00:00 +INFO - Started process 216 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'manual__2022-11-12T23:18:25.241753+00:00', '--job-id', '1111', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpumnr8npm'] +INFO - Job 1111: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T23:18:25.241753+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221112T231825, start_date=20221112T231829, end_date=20221112T231833 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 
'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:18:33.528841Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a19df9fd-b962-4b31-8f1b-9610f1b85398"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..dd76f334 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml 
and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:18:50.158785Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": 
"{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T23:18:25.241753Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", 
"queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1ee23058-86d7-47db-bc71-0f75a7002754"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-12T23:18:25.241753+00:00, map_index=-1, run_start_date=2022-11-12 23:18:50.158785+00:00, try_number=1, job_id=1114, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 23:18:25.241753+00:00 +INFO - Started process 235 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-12T23:18:25.241753+00:00', '--job-id', '1114', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpcxftwmv4'] +INFO - Job 1114: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T23:18:25.241753+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd87712f670> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T231825, start_date=20221112T231850, end_date=20221112T231851 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1114 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 235) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=2.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..c3332bba --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:55.216160Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T23:18:25.241753Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a023db8f-8a1f-43e4-979b-833d94d78e7c"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-12T23:18:25.241753+00:00, map_index=-1, run_start_date=2022-11-12 23:28:55.216160+00:00, try_number=2, job_id=1132, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 23:18:25.241753+00:00 +INFO - Started process 399 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-12T23:18:25.241753+00:00', '--job-id', '1132', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpojjp4c5w'] +INFO - Job 1132: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting 
has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T23:18:25.241753+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) 
+ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = 
retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another 
exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770eb310> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, 
{'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T231825, start_date=20221112T232855, end_date=20221112T232856 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1132 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 399) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=3.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=3.log" new file mode 100644 index 00000000..480b620e --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=3.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 3 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:39:00.119967Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T23:18:25.241753Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1da2920b-383a-4972-a9db-1156674c1b49"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-12T23:18:25.241753+00:00, map_index=-1, run_start_date=2022-11-12 23:39:00.119967+00:00, try_number=3, job_id=1143, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 23:18:25.241753+00:00 +INFO - Started process 518 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-12T23:18:25.241753+00:00', '--job-id', '1143', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1cpd_blg'] +INFO - Job 1143: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting 
has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T23:18:25.241753+00:00 +AIRFLOW_CTX_TRY_NUMBER=3 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) 
+ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = 
retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another 
exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd87712e670> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, 
{'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T231825, start_date=20221112T233900, end_date=20221112T233901 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1143 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 518) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=4.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=4.log" new file mode 100644 index 00000000..74bb3020 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskLoad/attempt=4.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 4 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:49:03.467815Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T23:18:25.241753Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1572379b-70b1-4419-ade5-1cb3eb3207dc"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-12T23:18:25.241753+00:00, map_index=-1, run_start_date=2022-11-12 23:49:03.467815+00:00, try_number=4, job_id=1160, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 23:18:25.241753+00:00 +INFO - Started process 679 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'manual__2022-11-12T23:18:25.241753+00:00', '--job-id', '1160', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpdapon066'] +INFO - Job 1160: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting 
has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T23:18:25.241753+00:00 +AIRFLOW_CTX_TRY_NUMBER=4 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) 
+ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = 
retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another 
exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ec8b0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, 
{'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T231825, start_date=20221112T234903, end_date=20221112T234904 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1160 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 679) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskTransform/attempt=1.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..e80b03a0 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=manual__2022-11-12T23\357\200\27218\357\200\27225.241753+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:18:37.933471Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T23:18:25.241753Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "74cd7adf-5c3d-37d0-a76d-e0e6b5e2761f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e28423eb-6406-4230-a531-4b7c5e991f15"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-12T23:18:25.241753+00:00, map_index=-1, run_start_date=2022-11-12 23:18:37.933471+00:00, try_number=1, job_id=1113, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 23:18:25.241753+00:00 +INFO - Started process 226 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'manual__2022-11-12T23:18:25.241753+00:00', '--job-id', '1113', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp7rkydb30'] +INFO - Job 1113: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in 
[database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T23:18:25.241753+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221112T231825, start_date=20221112T231837, end_date=20221112T231847 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-12T23:18:25.241753+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 
'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:18:47.522646Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, 
"_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e28423eb-6406-4230-a531-4b7c5e991f15"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..baea155e --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - 
Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:03:39.596180Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", 
"wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:03:38.668049Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "c0c3ba2d-7440-3152-82b4-952b6ea52904"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "c0c3ba2d-7440-3152-82b4-952b6ea52904"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": 
"default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8861b6bc-3e2a-46ed-9378-5cb7df38759d"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T05:03:38.668049+00:00, map_index=-1, run_start_date=2022-11-10 06:03:39.596180+00:00, try_number=1, job_id=575, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:03:38.668049+00:00 +INFO - Started process 673 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T05:03:38.668049+00:00', '--job-id', '575', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpobat4fs0'] +INFO - Job 575: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:03:38.668049+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:03:38.668049+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T050338, start_date=20221110T060339, end_date=20221110T060343 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T05:03:38.668049+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': 
False, 'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:03:43.089730Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": 
[{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8861b6bc-3e2a-46ed-9378-5cb7df38759d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..6ea90a89 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not 
find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:03:48.604173Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:03:38.668049Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "c0c3ba2d-7440-3152-82b4-952b6ea52904"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "c0c3ba2d-7440-3152-82b4-952b6ea52904"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "522ce595-c822-40cd-8fc1-df7b75208286"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T05:03:38.668049+00:00, map_index=-1, run_start_date=2022-11-10 06:03:48.604173+00:00, try_number=1, job_id=577, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:03:38.668049+00:00 +INFO - Started process 683 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T05:03:38.668049+00:00', '--job-id', '577', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpfq0ftw6l'] +INFO - Job 577: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:03:38.668049+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:03:38.668049+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc33bd5b80> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'j1CgIyl1vTeuUDBLjWCwbA==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:j1CgIyl1vTeuUDBLjWCwbA== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T060350Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T060350Z +20221110/us-east-1/s3/aws4_request +d9f0b94e0e99cf85d59e89b527c5a193912655667992fe5783a1beddfad15999 +INFO - '2022-11-10' - botocore.auth - Signature: +d2a02d75f9d654a92a10a00a172b35f9acad3fb3b7e40f800262241fec40fe37 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': '85y//sall7QVPyMH33F/ymbJNcxb9xUtgTRjbjUELhVI6w1CE+oEmGFG1vrpJp30GokT9lgHmTs=', 'x-amz-request-id': 'BT7NH4JXY2R03K07', 'Date': 'Thu, 10 Nov 2022 06:03:50 GMT', 'ETag': '"8f50a0232975bd37ae50304b8d60b06c"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T050338, start_date=20221110T060348, end_date=20221110T060354 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T05:03:38.668049+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:03:54.693748Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "522ce595-c822-40cd-8fc1-df7b75208286"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..4416fcb1 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27203\357\200\27238.668049+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:03:43.645283Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:03:38.668049Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "c0c3ba2d-7440-3152-82b4-952b6ea52904"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "c0c3ba2d-7440-3152-82b4-952b6ea52904"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f16f049b-f3de-4008-b566-17f26fdca2e7"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T05:03:38.668049+00:00, map_index=-1, run_start_date=2022-11-10 06:03:43.645283+00:00, try_number=1, job_id=576, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:03:38.668049+00:00 +INFO - Started process 678 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T05:03:38.668049+00:00', '--job-id', '576', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp8zbmj4iq'] +INFO - Job 576: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:03:38.668049+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:03:38.668049+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T050338, start_date=20221110T060343, end_date=20221110T060347 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T05:03:38.668049+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:03:47.399956Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f16f049b-f3de-4008-b566-17f26fdca2e7"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..b32344b2 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,51 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:11:38.581829Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": 
"2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, 
"executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bcc7eb1c-fc63-43c4-b769-ca1231fa84e2"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T05:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 06:11:38.581829+00:00, try_number=1, job_id=580, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:11:21.828118+00:00 +INFO - Started process 1418 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T05:11:21.828118+00:00', '--job-id', '580', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmphjonz_d_'] +INFO - Job 580: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - Done. Returned value was: {{ task_instance.xcom_pull(task_ids='extract', dag_id='adhoc_airflow', key='return_value') }} +ERROR - Could not serialize the XCom value into JSON. If you are using pickle instead of JSON for XCom, then you need to enable pickle support for XCom in your airflow config. +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/taskinstance.py", line 2378, in xcom_push + XCom.set( + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 206, in set + value = cls.serialize_value( + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 597, in serialize_value + return json.dumps(value).encode('UTF-8') + File "/usr/local/lib/python3.9/json/__init__.py", line 231, in dumps + return _default_encoder.encode(obj) + File "/usr/local/lib/python3.9/json/encoder.py", line 199, in encode + chunks = self.iterencode(o, _one_shot=True) + File "/usr/local/lib/python3.9/json/encoder.py", line 257, in iterencode + return _iterencode(o, 0) + File "/usr/local/lib/python3.9/json/encoder.py", line 179, in default + raise TypeError(f'Object of type {o.__class__.__name__} ' +TypeError: Object of type PlainXComArg is not JSON serializable +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T051121, start_date=20221110T061138, end_date=20221110T061139 +ERROR - Failed to execute job 580 for task TaskExtract (Object of type PlainXComArg is not JSON serializable; 1418) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..7976e562 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:21:39.913182Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e3cabba2-9cf1-409c-b911-24906dbca2c2"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T05:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 06:21:39.913182+00:00, try_number=2, job_id=589, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:11:21.828118+00:00 +INFO - Started process 2452 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T05:11:21.828118+00:00', '--job-id', '589', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpkatdxv4q'] +INFO - Job 589: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T051121, start_date=20221110T062139, end_date=20221110T062143 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': 
False, 'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:43.176053Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": 
[{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e3cabba2-9cf1-409c-b911-24906dbca2c2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..7856ffa6 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,168 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not 
find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:21:47.828898Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f363ead2-f2bf-4617-b092-a4035e812e62"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T05:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 06:21:47.828898+00:00, try_number=1, job_id=593, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:11:21.828118+00:00 +INFO - Started process 2473 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T05:11:21.828118+00:00', '--job-id', '593', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp2r34dc3l'] +INFO - Job 593: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc542848b0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'r53hmRPSCIRyITb6RL7Qdw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:r53hmRPSCIRyITb6RL7Qdw== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T062148Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T062148Z +20221110/us-east-1/s3/aws4_request +b682353e2184570d1d35a8b9c1851258065bbd7e5662be7fbcffd4dccb6f62f5 +INFO - '2022-11-10' - botocore.auth - Signature: +d220e52be653b15046c7ca42a31315776563835a6982f8d3ad9856c01448fe4c +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. 
+INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 503 None +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-request-id': '42BPFVNPKRV869JY', 'x-amz-id-2': 'Sh/vX6fObnmBlzGlb1bFauRKkesyOabAzkDzUdXVPIxiQtaG5/KmGHfV1vZoX5RrJemEJ2S01OE=', 'Content-Type': 'application/xml', 'Transfer-Encoding': 'chunked', 'Date': 'Thu, 10 Nov 2022 06:21:48 GMT', 'Server': 'AmazonS3', 'Connection': 'close'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'\nSlowDownPlease reduce your request rate.42BPFVNPKRV869JYSh/vX6fObnmBlzGlb1bFauRKkesyOabAzkDzUdXVPIxiQtaG5/KmGHfV1vZoX5RrJemEJ2S01OE=' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - retry needed: retryable HTTP status code received: 503 +INFO - '2022-11-10' - botocore.retryhandler - Retry needed, action of: 0.022834795661573093 +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.endpoint - Response received to retry, sleeping for 0.022834795661573093 seconds +INFO - '2022-11-10' - botocore.awsrequest - Rewinding stream: +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: 
https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. +INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:r53hmRPSCIRyITb6RL7Qdw== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T062150Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T062150Z +20221110/us-east-1/s3/aws4_request +a60a0d7896fae6baeca5a0c622e683e4a9be182fb4577eeb742405d1fc8301d9 +INFO - '2022-11-10' - botocore.auth - Signature: +632a891a6170cfefe9e5af092868e5c75576eaacb9871086101c56a4d5a7dd33 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Resetting dropped connection: dipa-s3.s3.amazonaws.com +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. 
+INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': '37h6h9606UDqnqqVtT4/94Ay/vreAgft8jV+4+GAq39TybhWunf0DFpwtVHI4VlzixJu8p3eENA=', 'x-amz-request-id': 'T5GD1X7P6X1032SK', 'Date': 'Thu, 10 Nov 2022 06:21:50 GMT', 'ETag': '"af9de19913d20884722136fa44bed077"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T051121, start_date=20221110T062147, end_date=20221110T062151 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 
'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:51.620323Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", 
"_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f363ead2-f2bf-4617-b092-a4035e812e62"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..c377d291 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - 
+-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:21:43.933205Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": 
"default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "41e541ed-b159-352a-86d4-fb688b8288f1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, 
"email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a199c794-6681-4a0b-a07d-453f4ff0b312"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T05:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 06:21:43.933205+00:00, try_number=1, job_id=592, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:11:21.828118+00:00 +INFO - Started process 2463 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T05:11:21.828118+00:00', '--job-id', '592', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpqzizoz3x'] +INFO - Job 592: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T051121, start_date=20221110T062143, end_date=20221110T062147 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T05:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 
'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:21:47.062957Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", 
"retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a199c794-6681-4a0b-a07d-453f4ff0b312"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..7f512821 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T07:11:22.533189Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "831219ee-b73c-35b0-a75f-6bfbb9ceeb41"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "831219ee-b73c-35b0-a75f-6bfbb9ceeb41"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b4f6b7a-82fb-40f7-8bd5-b3c3beabbd35"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T06:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 07:11:22.533189+00:00, try_number=1, job_id=610, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:21.828118+00:00 +INFO - Started process 7433 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T06:11:21.828118+00:00', '--job-id', '610', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp_5w4wjy8'] +INFO - Job 610: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T06:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T061121, start_date=20221110T071122, end_date=20221110T071125 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T06:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': 
False, 'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T07:11:25.531115Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": 
[{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8b4f6b7a-82fb-40f7-8bd5-b3c3beabbd35"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..1a4dc3c0 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not 
find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T07:11:31.104516Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "831219ee-b73c-35b0-a75f-6bfbb9ceeb41"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "831219ee-b73c-35b0-a75f-6bfbb9ceeb41"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5182c925-4780-4a69-831b-900ca4469ddb"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T06:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 07:11:31.104516+00:00, try_number=1, job_id=612, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:21.828118+00:00 +INFO - Started process 7443 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T06:11:21.828118+00:00', '--job-id', '612', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpvkc_hyel'] +INFO - Job 612: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T06:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc54278820> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'I94l6hmz9Cg7/S0w9RqLAg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNComahue_process.txt + +content-md5:I94l6hmz9Cg7/S0w9RqLAg== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T071131Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T071131Z +20221110/us-east-1/s3/aws4_request +8b8503d4d06a09e5facfbc411f2f43efb6485aa05a4269ae0b94191d1247bd16 +INFO - '2022-11-10' - botocore.auth - Signature: +be381db71c09dbc0580aa3aaac1642c866d269bec604d8494556208f784c3a8c +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNComahue_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'TRjHZxwTAQ6yCeRXkIlVtG09743fD0jMz9lUDxMe7AvJwMz5NOnqbmXy6/hjJiP9CHAJzgKVzUk=', 'x-amz-request-id': 'D3WD38T1A6G5E4KJ', 'Date': 'Thu, 10 Nov 2022 07:11:32 GMT', 'ETag': '"23de25ea19b3f4283bfd2d30f51a8b02"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T061121, start_date=20221110T071131, end_date=20221110T071133 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T06:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNComahue_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T07:11:33.180266Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", 
"params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5182c925-4780-4a69-831b-900ca4469ddb"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..f93f19c5 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T07:11:26.623637Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "831219ee-b73c-35b0-a75f-6bfbb9ceeb41"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "831219ee-b73c-35b0-a75f-6bfbb9ceeb41"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ef1d9248-22ec-4594-91be-eed3e8ed1a9a"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T06:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 07:11:26.623637+00:00, try_number=1, job_id=611, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:11:21.828118+00:00 +INFO - Started process 7438 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T06:11:21.828118+00:00', '--job-id', '611', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpho6wor4d'] +INFO - Job 611: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T06:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T061121, start_date=20221110T071126, end_date=20221110T071129 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T06:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T07:11:29.751025Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ef1d9248-22ec-4594-91be-eed3e8ed1a9a"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..2510bd8c --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T08:11:22.824142Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb45ec6f-cd9c-4f69-abc0-1775a7a4988d"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T07:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 08:11:22.824142+00:00, try_number=1, job_id=618, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:11:21.828118+00:00 +INFO - Started process 2429 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T07:11:21.828118+00:00', '--job-id', '618', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpyy5u40xt'] +INFO - Job 618: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221110T071121, start_date=20221110T081122, end_date=20221110T081125 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T07:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': 
False, 'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T08:11:25.961690Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": 
[{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "cb45ec6f-cd9c-4f69-abc0-1775a7a4988d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..53abaf2d --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not 
find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T08:11:30.006274Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8814c2cb-e518-41e4-b6cf-c5205b791ffc"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 08:11:30.006274+00:00, try_number=1, job_id=620, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:11:21.828118+00:00 +INFO - Started process 2444 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:11:21.828118+00:00', '--job-id', '620', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmpzobdcne2'] +INFO - Job 620: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228ee60700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling 
handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'x10vWCklRdwnFWV5GuU9dg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, 
in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T071121, start_date=20221110T081130, end_date=20221110T081130 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 620 for task TaskLoad (Unable to locate credentials; 2444) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=2.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..bc5273e2 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T08:21:31.200114Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2cdd4e50-eb26-41db-a629-1c63694bda39"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 08:21:31.200114+00:00, try_number=2, job_id=624, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:11:21.828118+00:00 +INFO - Started process 3961 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:11:21.828118+00:00', '--job-id', '624', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmphil7xkdl'] +INFO - Job 624: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-10' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228eed2e50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling 
handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNComahue_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'x10vWCklRdwnFWV5GuU9dg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNComahue_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNComahue_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, 
in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221110T071121, start_date=20221110T082131, end_date=20221110T082131 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 624 for task TaskLoad (Unable to locate credentials; 3961) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..6dd235ae --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27211\357\200\27221.828118+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T08:11:26.704517Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:11:21.828118Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "06a87121-b963-36c2-b6bc-c29f5223d7d1"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea739f93-c671-4aa1-81f3-38e0c7002a1e"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T07:11:21.828118+00:00, map_index=-1, run_start_date=2022-11-10 08:11:26.704517+00:00, try_number=1, job_id=619, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:11:21.828118+00:00 +INFO - Started process 2439 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T07:11:21.828118+00:00', '--job-id', '619', '--raw', '--subdir', 'DAGS_FOLDER/GBUNComahue_dag_elt.py', '--cfg-path', '/tmp/tmp6agiohci'] +INFO - Job 619: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:11:21.828118+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:11:21.828118+00:00 +INFO - '2022-11-10' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221110T071121, start_date=20221110T081126, end_date=20221110T081129 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T07:11:21.828118+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T08:11:29.236927Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ea739f93-c671-4aa1-81f3-38e0c7002a1e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..2131e8eb --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-12T23:18:29.069103Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T22:17:00.506420Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c31d63f8-6033-4491-97bf-a6d2d98d792b"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-12T22:17:00.506420+00:00, map_index=-1, run_start_date=2022-11-12 23:18:29.069103+00:00, try_number=1, job_id=1110, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 22:17:00.506420+00:00 +INFO - Started process 214 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskExtract', 'scheduled__2022-11-12T22:17:00.506420+00:00', '--job-id', '1110', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpebs2sz5o'] +INFO - Job 1110: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T22:17:00.506420+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Extract +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: alkemy_db +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-12' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-12' - GBUNComahue_dag_elt - universidad ... correo_electronico +0 UNIV. NACIONAL DEL COMAHUE ... FRANKALEXANDRA@YAHOO.COM +1 UNIV. NACIONAL DEL COMAHUE ... TEDWARDS@GMAIL.COM +2 UNIV. NACIONAL DEL COMAHUE ... RICHARD76@GMAIL.COM +3 UNIV. NACIONAL DEL COMAHUE ... ODUFFY@YAHOO.COM +4 UNIV. NACIONAL DEL COMAHUE ... FOSTERCHASE@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskExtract, execution_date=20221112T221700, start_date=20221112T231829, end_date=20221112T231833 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNComahue_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': 
False, 'task_id': 'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:18:33.666412Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": 
[{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c31d63f8-6033-4491-97bf-a6d2d98d792b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..7ac459ee --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not 
find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:18:50.174809Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T22:17:00.506420Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "555b1f0c-763f-4def-9a1e-5ca18a3e9d72"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-12T22:17:00.506420+00:00, map_index=-1, run_start_date=2022-11-12 23:18:50.174809+00:00, try_number=1, job_id=1115, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 22:17:00.506420+00:00 +INFO - Started process 236 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-12T22:17:00.506420+00:00', '--job-id', '1115', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp1j8uu4sy'] +INFO - Job 1115: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T22:17:00.506420+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling 
of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in 
connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback 
(most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd87712f430> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done 
waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T221700, start_date=20221112T231850, end_date=20221112T231851 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1115 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 236) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=2.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..d76baf5b --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:28:55.286601Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T22:17:00.506420Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bc6ecea8-2c51-4135-b745-b446702b1195"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-12T22:17:00.506420+00:00, map_index=-1, run_start_date=2022-11-12 23:28:55.286601+00:00, try_number=2, job_id=1133, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 22:17:00.506420+00:00 +INFO - Started process 400 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-12T22:17:00.506420+00:00', '--job-id', '1133', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmply7p7nfl'] +INFO - Job 1133: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old 
setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T22:17:00.506420+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) 
+ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = 
retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another 
exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8770ed310> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, 
{'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T221700, start_date=20221112T232855, end_date=20221112T232856 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1133 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 400) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=3.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=3.log" new file mode 100644 index 00000000..77185d72 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=3.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 3 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:38:59.784114Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T22:17:00.506420Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ce10f392-1311-417c-ab5d-402d2cdceb10"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-12T22:17:00.506420+00:00, map_index=-1, run_start_date=2022-11-12 23:38:59.784114+00:00, try_number=3, job_id=1142, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 22:17:00.506420+00:00 +INFO - Started process 515 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-12T22:17:00.506420+00:00', '--job-id', '1142', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmp3c2c1kq_'] +INFO - Job 1142: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old 
setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T22:17:00.506420+00:00 +AIRFLOW_CTX_TRY_NUMBER=3 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) 
+ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = 
retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another 
exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8771305e0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, 
{'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T221700, start_date=20221112T233859, end_date=20221112T233900 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1142 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 515) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=4.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=4.log" new file mode 100644 index 00000000..87d06d06 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskLoad/attempt=4.log" @@ -0,0 +1,257 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 4 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:49:03.891566Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": 
"GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T22:17:00.506420Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e8043a27-7b42-4500-96b8-f48f4546bdd0"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-12T22:17:00.506420+00:00, map_index=-1, run_start_date=2022-11-12 23:49:03.891566+00:00, try_number=4, job_id=1161, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 22:17:00.506420+00:00 +INFO - Started process 682 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskLoad', 'scheduled__2022-11-12T22:17:00.506420+00:00', '--job-id', '1161', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpqq3h_xbj'] +INFO - Job 1161: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old 
setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T22:17:00.506420+00:00 +AIRFLOW_CTX_TRY_NUMBER=4 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Load: GBUNComahue_dag_elt +INFO - '2022-11-12' - GBUNComahue_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-12' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-12' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-12' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-12' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-12' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-12' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) 
+ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-12' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = 
retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another 
exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-12' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-12' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fd8771315e0> +INFO - '2022-11-12' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-12' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-12' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-12' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, 
{'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-12' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-12' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-12' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-12' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-12' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': '', 'key': 'GBUNComahue_process.txt', 'extra_args': {}} +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-12' - s3transfer.tasks - Exception raised. 
+Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - '2022-11-12' - s3transfer.utils - Releasing 
acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNComahue_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 878, in _make_api_call + request_dict = self._convert_to_request_dict( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 936, in _convert_to_request_dict + api_params = self._emit_api_params( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 969, in _emit_api_params + self.meta.events.emit( + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/handlers.py", line 275, in validate_bucket_name + raise ParamValidationError(report=error_msg) +botocore.exceptions.ParamValidationError: Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$" +INFO - Marking task as UP_FOR_RETRY. dag_id=GBUNComahue_dag_elt, task_id=TaskLoad, execution_date=20221112T221700, start_date=20221112T234903, end_date=20221112T234904 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 1161 for task TaskLoad (Parameter validation failed: +Invalid bucket name "": Bucket name must match the regex "^[a-zA-Z0-9.\-_]{1,255}$" or be an ARN matching the regex "^arn:(aws).*:(s3|s3-object-lambda):[a-z\-0-9]*:[0-9]{12}:accesspoint[/:][a-zA-Z0-9\-.]{1,63}$|^arn:(aws).*:s3-outposts:[a-z\-0-9]+:[0-9]{12}:outpost[/:][a-zA-Z0-9\-]{1,63}[/:]accesspoint[/:][a-zA-Z0-9\-]{1,63}$"; 682) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskTransform/attempt=1.log" 
"b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..e8161dc6 --- /dev/null +++ "b/dags/logs/dag_id=GBUNComahue_dag_elt/run_id=scheduled__2022-11-12T22\357\200\27217\357\200\27200.506420+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-12T23:18:37.303719Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": 
{"dag_id": "GBUNComahue_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-12T22:17:00.506420Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNComahue_dag_elt", "namespace": "default"}, "run": {"runId": "54454f2d-4836-3fd1-ab08-da8354993b75"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": 
"https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a771daa5-6ce1-4d0f-8c41-48cd58526247"}} +INFO - TaskInstance Details: dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-12T22:17:00.506420+00:00, map_index=-1, run_start_date=2022-11-12 23:18:37.303719+00:00, try_number=1, job_id=1112, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-12 22:17:00.506420+00:00 +INFO - Started process 223 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNComahue_dag_elt', 'TaskTransform', 'scheduled__2022-11-12T22:17:00.506420+00:00', '--job-id', '1112', '--raw', '--subdir', 'DAGS_FOLDER/factory.py', '--cfg-path', '/tmp/tmpecqlcy5c'] +INFO - Job 1112: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in 
[database] - the old setting has been used, but please update your config. +INFO - Running on host 7a9af4658e35 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNComahue_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-12T22:17:00.506420+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - GBUNComahue_dag_elt - Transform +INFO - ['GBUNComahue', 'select.csv'] +INFO - GBUNComahue +INFO - GBUNComahue_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNComahue_dag_elt, task_id=TaskTransform, execution_date=20221112T221700, start_date=20221112T231837, end_date=20221112T231846 +INFO - '2022-11-12' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-12' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-12' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNComahue_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-12T22:17:00.506420+00:00 +INFO - '2022-11-12' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNComahue_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': 
True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-12' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-12' - openlineage.client.transport.console - {"eventTime": "2022-11-12T23:18:46.922001Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNComahue_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, 
"_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a771daa5-6ce1-4d0f-8c41-48cd58526247"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..d12fa42a --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't 
initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:11:09.777145Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": 
false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:00:56.675892Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "f4f51ac9-6eba-33e0-8cc5-891ae1600f0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "f4f51ac9-6eba-33e0-8cc5-891ae1600f0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, 
"retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36f4d8dc-7333-43bd-998a-649d2b8a1305"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:00:56.675892+00:00, map_index=-1, run_start_date=2022-11-09 19:11:09.777145+00:00, try_number=2, job_id=547, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:00:56.675892+00:00 +INFO - Started process 801 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:00:56.675892+00:00', '--job-id', '547', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp463ie2hh'] +INFO - Job 547: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:00:56.675892+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:00:56.675892+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221109T190056, start_date=20221109T191109, end_date=20221109T191112 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:00:56.675892+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:11:12.477450Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "36f4d8dc-7333-43bd-998a-649d2b8a1305"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..00068a80 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:11:20.124049Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:00:56.675892Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "f4f51ac9-6eba-33e0-8cc5-891ae1600f0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "f4f51ac9-6eba-33e0-8cc5-891ae1600f0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a0464978-8b04-40b9-8c6d-6a758a4292d4"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:00:56.675892+00:00, map_index=-1, run_start_date=2022-11-09 19:11:20.124049+00:00, try_number=1, job_id=550, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:00:56.675892+00:00 +INFO - Started process 825 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:00:56.675892+00:00', '--job-id', '550', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmphexnniow'] +INFO - Job 550: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:00:56.675892+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:00:56.675892+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e622af0> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'jwkvOsqGaFnNoLEn5GvyaQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNSalvador_process.txt + +content-md5:jwkvOsqGaFnNoLEn5GvyaQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191121Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191121Z +20221109/us-east-1/s3/aws4_request +479d6f2d753f5eee488d88711e1f23956d9bd8ae4b7b2b00342114e2555335bf +INFO - '2022-11-09' - botocore.auth - Signature: +abd5b75fadbc17dca76dd88a9dd7051bf69201fb5049f3140e34128bc55657a3 +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'H3GUvHzuXN0p5DJPrTPHH5GDV/6J33+FkrUvCsNB5b9jkzziJUAAgluNxmLy6NcSHigGH9u80SM=', 'x-amz-request-id': 'Q6VVT78PJ1SRGA05', 'Date': 'Wed, 09 Nov 2022 19:11:20 GMT', 'ETag': '"8f092f3aca866859cda0b127e46bf269"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221109T190056, start_date=20221109T191120, end_date=20221109T191122 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:00:56.675892+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:11:22.809898Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a0464978-8b04-40b9-8c6d-6a758a4292d4"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..8cca0864 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27200\357\200\27256.675892+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:11:13.436708Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:00:56.675892Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "f4f51ac9-6eba-33e0-8cc5-891ae1600f0e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "f4f51ac9-6eba-33e0-8cc5-891ae1600f0e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "624ce4f9-9f14-4677-9f4b-1a5d6d2e0c2b"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:00:56.675892+00:00, map_index=-1, run_start_date=2022-11-09 19:11:13.436708+00:00, try_number=1, job_id=548, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:00:56.675892+00:00 +INFO - Started process 806 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:00:56.675892+00:00', '--job-id', '548', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpon4_lvv0'] +INFO - Job 548: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:00:56.675892+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:00:56.675892+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221109T190056, start_date=20221109T191113, end_date=20221109T191119 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:00:56.675892+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:11:19.415164Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "624ce4f9-9f14-4677-9f4b-1a5d6d2e0c2b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..cd3de759 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:09:55.414388Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:09:54.391041Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "757b12ae-8a0e-3290-88f8-7f5acfa9e9ab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "757b12ae-8a0e-3290-88f8-7f5acfa9e9ab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "53447a5e-ea86-42d9-a6ad-30c04ae57f73"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:09:54.391041+00:00, map_index=-1, run_start_date=2022-11-09 19:09:55.414388+00:00, try_number=1, job_id=541, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:09:54.391041+00:00 +INFO - Started process 662 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:09:54.391041+00:00', '--job-id', '541', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpverzfsm4'] +INFO - Job 541: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:09:54.391041+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:09:54.391041+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221109T190954, start_date=20221109T190955, end_date=20221109T190959 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:09:54.391041+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:09:59.175405Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "53447a5e-ea86-42d9-a6ad-30c04ae57f73"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..2900179f --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:10:08.287980Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:09:54.391041Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "757b12ae-8a0e-3290-88f8-7f5acfa9e9ab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "757b12ae-8a0e-3290-88f8-7f5acfa9e9ab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1028508c-09c2-49af-a5ed-73cb2e5c5cc8"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:09:54.391041+00:00, map_index=-1, run_start_date=2022-11-09 19:10:08.287980+00:00, try_number=1, job_id=545, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:09:54.391041+00:00 +INFO - Started process 686 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:09:54.391041+00:00', '--job-id', '545', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp17e8x99r'] +INFO - Job 545: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:09:54.391041+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:09:54.391041+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e621e50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'gncXnYr6XgHPDadrOsmeBg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNSalvador_process.txt + +content-md5:gncXnYr6XgHPDadrOsmeBg== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191009Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191009Z +20221109/us-east-1/s3/aws4_request +4440537cb2c119d2103d84bb1ff197a3a0860cd783a342713f352840a3727365 +INFO - '2022-11-09' - botocore.auth - Signature: +85f1a4b9c6e7a07477b78e556d6a7fa16bd75fa76f8ba0f1fd3ecbfd8db419df +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': '6ORUbqNM2eYjZzihCzi0WrVhyuNOckBgQx8i0vvYFnPrlMod1pJQ8uaVfqRdUEKEibb4rKQhjhw=', 'x-amz-request-id': 'N9J9FBWXSN6NTWS1', 'Date': 'Wed, 09 Nov 2022 19:10:08 GMT', 'ETag': '"8277179d8afa5e01cf0da76b3ac99e06"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221109T190954, start_date=20221109T191008, end_date=20221109T191010 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:09:54.391041+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:10:10.759748Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1028508c-09c2-49af-a5ed-73cb2e5c5cc8"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..7b33ce2d --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27209\357\200\27254.391041+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:09:59.848956Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:09:54.391041Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "757b12ae-8a0e-3290-88f8-7f5acfa9e9ab"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "757b12ae-8a0e-3290-88f8-7f5acfa9e9ab"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "71455aac-9f6c-41ba-90c2-06e2f22adc71"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:09:54.391041+00:00, map_index=-1, run_start_date=2022-11-09 19:09:59.848956+00:00, try_number=1, job_id=542, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:09:54.391041+00:00 +INFO - Started process 667 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:09:54.391041+00:00', '--job-id', '542', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp8mjuv30b'] +INFO - Job 542: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:09:54.391041+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:09:54.391041+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221109T190954, start_date=20221109T190959, end_date=20221109T191006 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:09:54.391041+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:10:06.626972Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "71455aac-9f6c-41ba-90c2-06e2f22adc71"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..115f45d5 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:12:54.444381Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:12:53.252347Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e92a0f86-ff7b-336e-b524-1384efb4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e92a0f86-ff7b-336e-b524-1384efb4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2be51493-939d-421d-9169-61966f6ce58b"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:12:53.252347+00:00, map_index=-1, run_start_date=2022-11-09 19:12:54.444381+00:00, try_number=1, job_id=560, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:12:53.252347+00:00 +INFO - Started process 1071 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:12:53.252347+00:00', '--job-id', '560', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpsvbcg1hv'] +INFO - Job 560: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:12:53.252347+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:12:53.252347+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221109T191253, start_date=20221109T191254, end_date=20221109T191257 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:12:53.252347+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:12:57.960786Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2be51493-939d-421d-9169-61966f6ce58b"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..ac3320f8 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:13:04.233228Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:12:53.252347Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e92a0f86-ff7b-336e-b524-1384efb4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e92a0f86-ff7b-336e-b524-1384efb4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "010de873-59f9-4524-8bfa-c44f2070f238"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:12:53.252347+00:00, map_index=-1, run_start_date=2022-11-09 19:13:04.233228+00:00, try_number=1, job_id=562, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:12:53.252347+00:00 +INFO - Started process 1081 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:12:53.252347+00:00', '--job-id', '562', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpkicu62d_'] +INFO - Job 562: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:12:53.252347+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:12:53.252347+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e620e50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '503Ir+z7OS2rrBvDN8vo9Q==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNSalvador_process.txt + +content-md5:503Ir+z7OS2rrBvDN8vo9Q== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T191304Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T191304Z +20221109/us-east-1/s3/aws4_request +a6fbe81913138ee3fbc8ef8c05ce381caa573dda39b39961204ef58333cf0e8e +INFO - '2022-11-09' - botocore.auth - Signature: +d07adfdf02975d544b8b2a65b683084a603a81181b31790011cd76c0c3e826d5 +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'j2+jw+5h/NM0eWtv/pYAHmVBi0C1T0SARp7WXGCPVu0VJdihwVBqNnbR7xKpn6cjbaHiBCtoG9w=', 'x-amz-request-id': 'W5G2YM9TTA16GSRV', 'Date': 'Wed, 09 Nov 2022 19:13:03 GMT', 'ETag': '"e74dc8afecfb392dabac1bc337cbe8f5"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221109T191253, start_date=20221109T191304, end_date=20221109T191306 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:12:53.252347+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:13:06.234469Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "010de873-59f9-4524-8bfa-c44f2070f238"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..32296dce --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27212\357\200\27253.252347+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:12:59.073725Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:12:53.252347Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e92a0f86-ff7b-336e-b524-1384efb4f316"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e92a0f86-ff7b-336e-b524-1384efb4f316"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "33f643bd-e1dd-4312-a69e-75d2dc5c4742"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:12:53.252347+00:00, map_index=-1, run_start_date=2022-11-09 19:12:59.073725+00:00, try_number=1, job_id=561, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:12:53.252347+00:00 +INFO - Started process 1076 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:12:53.252347+00:00', '--job-id', '561', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpcwfzhh42'] +INFO - Job 561: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:12:53.252347+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:12:53.252347+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221109T191253, start_date=20221109T191259, end_date=20221109T191303 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:12:53.252347+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:13:03.784526Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "33f643bd-e1dd-4312-a69e-75d2dc5c4742"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..ff6d3686 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:21:49.504365Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:21:48.052338Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "797cf908-40a8-3c6b-9252-79667fbc5fc6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "797cf908-40a8-3c6b-9252-79667fbc5fc6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2bda5d62-db39-481c-a387-d6b9342380e5"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-09T19:21:48.052338+00:00, map_index=-1, run_start_date=2022-11-09 19:21:49.504365+00:00, try_number=1, job_id=566, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:21:48.052338+00:00 +INFO - Started process 1965 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-09T19:21:48.052338+00:00', '--job-id', '566', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp4bc7ibwb'] +INFO - Job 566: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:21:48.052338+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:21:48.052338+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-09' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-09' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221109T192148, start_date=20221109T192149, end_date=20221109T192152 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-09T19:21:48.052338+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:21:52.739840Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2bda5d62-db39-481c-a387-d6b9342380e5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..a28110a1 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,123 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-09T19:21:58.830444Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:21:48.052338Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "797cf908-40a8-3c6b-9252-79667fbc5fc6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "797cf908-40a8-3c6b-9252-79667fbc5fc6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b0bbdad-da39-40e8-a371-38854ff91efc"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-09T19:21:48.052338+00:00, map_index=-1, run_start_date=2022-11-09 19:21:58.830444+00:00, try_number=1, job_id=568, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:21:48.052338+00:00 +INFO - Started process 1975 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-09T19:21:48.052338+00:00', '--job-id', '568', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpizorhkih'] +INFO - Job 568: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:21:48.052338+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:21:48.052338+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-09' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-09' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-09' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-09' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-09' - 
botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-09' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f289e61ce50> +INFO - '2022-11-09' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-09' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-09' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-09' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-09' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. 
+INFO - '2022-11-09' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-09' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-09' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'preprocess/GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'iKkfMCqUD5aIGz7i6VoU/g==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-09' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-09' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/preprocess/GBUNSalvador_process.txt +INFO - '2022-11-09' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-09' - botocore.auth - CanonicalRequest: +PUT +/preprocess/GBUNSalvador_process.txt + +content-md5:iKkfMCqUD5aIGz7i6VoU/g== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221109T192159Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-09' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221109T192159Z +20221109/us-east-1/s3/aws4_request +15b37fb60970cd30a27f284e7257c80b9d4c7ce011ef11b4b07c19e439dd3a2a +INFO - '2022-11-09' - botocore.auth - Signature: +51a35e00448e02c5c99bdc1349465850ff37e15cea8ab90bf2ad0103ed605e06 +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.endpoint - Sending http request: +INFO - '2022-11-09' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-09' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-09' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-09' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-09' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /preprocess/GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-09' - botocore.parsers - Response headers: {'x-amz-id-2': 'o5Y8A3tzgpFx8rCXJxxN1uKeGQ3mbrimc4Fj99Ci7qV1SIUY+aKMUfcnuF+uwsvR+oNIP/Yoqak=', 'x-amz-request-id': '7ZWTHGFHRPFRG95C', 'Date': 'Wed, 09 Nov 2022 19:21:58 GMT', 'ETag': '"88a91f302a940f96881b3ee2e95a14fe"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-09' - botocore.parsers - Response body: +b'' +INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-09' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-09' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-09' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221109T192148, start_date=20221109T192158, end_date=20221109T192200 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-09T19:21:48.052338+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:22:00.912097Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3b0bbdad-da39-40e8-a371-38854ff91efc"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..546c6577 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-09T19\357\200\27221\357\200\27248.052338+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-09T19:21:53.682793Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-09T19:21:48.052338Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "797cf908-40a8-3c6b-9252-79667fbc5fc6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "797cf908-40a8-3c6b-9252-79667fbc5fc6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e10b8c8d-cecc-4a83-9c7d-27080e85ade5"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-09T19:21:48.052338+00:00, map_index=-1, run_start_date=2022-11-09 19:21:53.682793+00:00, try_number=1, job_id=567, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-09 19:21:48.052338+00:00 +INFO - Started process 1970 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-09T19:21:48.052338+00:00', '--job-id', '567', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpztato0yd'] +INFO - Job 567: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 03a0f0f60b55 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-09T19:21:48.052338+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-09T19:21:48.052338+00:00 +INFO - '2022-11-09' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221109T192148, start_date=20221109T192153, end_date=20221109T192158 +INFO - '2022-11-09' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-09' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-09' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-09T19:21:48.052338+00:00 +INFO - '2022-11-09' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-09' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-09' - openlineage.client.transport.console - {"eventTime": "2022-11-09T19:21:58.296756Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e10b8c8d-cecc-4a83-9c7d-27080e85ade5"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..19f80a9d --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,51 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:13:21.041134Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": 
"2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:13:19.477101Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, 
"executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e7848b4b-ede5-4216-aeaa-045677b67e34"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:13:19.477101+00:00, map_index=-1, run_start_date=2022-11-10 06:13:21.041134+00:00, try_number=1, job_id=581, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:13:19.477101+00:00 +INFO - Started process 1615 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:13:19.477101+00:00', '--job-id', '581', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpw8xsdzlf'] +INFO - Job 581: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:13:19.477101+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:13:19.477101+00:00 +INFO - Done. Returned value was: {{ task_instance.xcom_pull(task_ids='extract', dag_id='adhoc_airflow', key='return_value') }} +ERROR - Could not serialize the XCom value into JSON. If you are using pickle instead of JSON for XCom, then you need to enable pickle support for XCom in your airflow config. +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/taskinstance.py", line 2378, in xcom_push + XCom.set( + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 206, in set + value = cls.serialize_value( + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 597, in serialize_value + return json.dumps(value).encode('UTF-8') + File "/usr/local/lib/python3.9/json/__init__.py", line 231, in dumps + return _default_encoder.encode(obj) + File "/usr/local/lib/python3.9/json/encoder.py", line 199, in encode + chunks = self.iterencode(o, _one_shot=True) + File "/usr/local/lib/python3.9/json/encoder.py", line 257, in iterencode + return _iterencode(o, 0) + File "/usr/local/lib/python3.9/json/encoder.py", line 179, in default + raise TypeError(f'Object of type {o.__class__.__name__} ' +TypeError: Object of type PlainXComArg is not JSON serializable +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T061319, start_date=20221110T061321, end_date=20221110T061321 +ERROR - Failed to execute job 581 for task TaskExtract (Object of type PlainXComArg is not JSON serializable; 1615) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..5ad48eee --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:23:23.234398Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:13:19.477101Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2556c8ce-f423-4c0b-a502-9eb8d70b6596"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:13:19.477101+00:00, map_index=-1, run_start_date=2022-11-10 06:23:23.234398+00:00, try_number=2, job_id=599, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:13:19.477101+00:00 +INFO - Started process 2654 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:13:19.477101+00:00', '--job-id', '599', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmprorqna7h'] +INFO - Job 599: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:13:19.477101+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:13:19.477101+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T061319, start_date=20221110T062323, end_date=20221110T062326 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:13:19.477101+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:23:26.511809Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "2556c8ce-f423-4c0b-a502-9eb8d70b6596"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..8dbf0a73 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:23:32.604688Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:13:19.477101Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d05cf6a-d015-4211-ac6f-86ba3c7a944d"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:13:19.477101+00:00, map_index=-1, run_start_date=2022-11-10 06:23:32.604688+00:00, try_number=1, job_id=602, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:13:19.477101+00:00 +INFO - Started process 2702 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:13:19.477101+00:00', '--job-id', '602', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpft8k8ll8'] +INFO - Job 602: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:13:19.477101+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:13:19.477101+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc542838b0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'N6V18ZBB5L+/Ym0KCsbx3Q==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:N6V18ZBB5L+/Ym0KCsbx3Q== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T062333Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T062333Z +20221110/us-east-1/s3/aws4_request +130acf3f59fac28373d69bfa2811504c066d623a071fe74a8012263f2dd99480 +INFO - '2022-11-10' - botocore.auth - Signature: +abaafc16c78f783b9a0049bf42590791869b2b256b5982936712fea935d75621 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'YY0lCe3ifllCDP0ajdVqYSmTTtYi3kcBSM+gjcbaIJBWfgTDyMtZ5n24IA1+vBCjmoulcISKgPk=', 'x-amz-request-id': 'XFKJPHCJ37GYJ5N2', 'Date': 'Thu, 10 Nov 2022 06:23:33 GMT', 'ETag': '"37a575f19041e4bfbf626d0a0ac6f1dd"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T061319, start_date=20221110T062332, end_date=20221110T062334 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:13:19.477101+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:23:34.953967Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0d05cf6a-d015-4211-ac6f-86ba3c7a944d"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..91c0f018 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27213\357\200\27219.477101+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:23:27.607932Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:13:19.477101Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "79a584f5-3d52-3549-9ce2-e0b739f053c6"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0bd42518-e97d-4a7a-82fc-ba3b8a024343"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:13:19.477101+00:00, map_index=-1, run_start_date=2022-11-10 06:23:27.607932+00:00, try_number=1, job_id=600, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:13:19.477101+00:00 +INFO - Started process 2677 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:13:19.477101+00:00', '--job-id', '600', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpkqu3v0jg'] +INFO - Job 600: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:13:19.477101+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:13:19.477101+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T061319, start_date=20221110T062327, end_date=20221110T062331 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:13:19.477101+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:23:31.862844Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0bd42518-e97d-4a7a-82fc-ba3b8a024343"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..6456f094 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:18:10.388370Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:18:08.895608Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "c23727d7-25ed-3ef2-af23-5b40af90fd5f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "c23727d7-25ed-3ef2-af23-5b40af90fd5f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93ce3933-ba2c-4df8-abd6-d01f1ad77efa"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:18:08.895608+00:00, map_index=-1, run_start_date=2022-11-10 06:18:10.388370+00:00, try_number=1, job_id=586, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:18:08.895608+00:00 +INFO - Started process 2082 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:18:08.895608+00:00', '--job-id', '586', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpdptgg3xz'] +INFO - Job 586: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:18:08.895608+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:18:08.895608+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T061808, start_date=20221110T061810, end_date=20221110T061813 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:18:08.895608+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:18:13.642315Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "93ce3933-ba2c-4df8-abd6-d01f1ad77efa"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..2fb29fb3 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:18:18.346996Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:18:08.895608Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "c23727d7-25ed-3ef2-af23-5b40af90fd5f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "c23727d7-25ed-3ef2-af23-5b40af90fd5f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d7d196a5-4604-434d-b726-91f451f5119e"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:18:08.895608+00:00, map_index=-1, run_start_date=2022-11-10 06:18:18.346996+00:00, try_number=1, job_id=588, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:18:08.895608+00:00 +INFO - Started process 2092 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:18:08.895608+00:00', '--job-id', '588', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpkdyjflar'] +INFO - Job 588: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:18:08.895608+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:18:08.895608+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc542848b0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'I4AB+YNwMbOb86U+l+69Sw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:I4AB+YNwMbOb86U+l+69Sw== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T061818Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T061818Z +20221110/us-east-1/s3/aws4_request +96b627208cfa39824e2f217020b327d4af030dcfd149518f38a3cde6529f7b02 +INFO - '2022-11-10' - botocore.auth - Signature: +7d9e3f659cf7f6f9dea3a8ecb7e5f2b7f1c7f73e98b139a8a3916225eb611957 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'Q1ceoOXzrSQL4IZuEXLvQoxgElTkcQb1XAYawSoaJ6zwvnw2cqzZhwnptmdbz+cdrx1EOz92eLM=', 'x-amz-request-id': '4RX4RGDXXA0KH7E5', 'Date': 'Thu, 10 Nov 2022 06:18:19 GMT', 'ETag': '"238001f9837031b39bf3a53e97eebd4b"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T061808, start_date=20221110T061818, end_date=20221110T061820 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:18:08.895608+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:18:20.784387Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d7d196a5-4604-434d-b726-91f451f5119e"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..ade3ac37 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27218\357\200\27208.895608+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:18:14.326600Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:18:08.895608Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "c23727d7-25ed-3ef2-af23-5b40af90fd5f"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "c23727d7-25ed-3ef2-af23-5b40af90fd5f"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f0d9854f-2a8d-4c8e-9997-edea94fafcba"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:18:08.895608+00:00, map_index=-1, run_start_date=2022-11-10 06:18:14.326600+00:00, try_number=1, job_id=587, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:18:08.895608+00:00 +INFO - Started process 2087 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:18:08.895608+00:00', '--job-id', '587', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp25a6ext0'] +INFO - Job 587: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:18:08.895608+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:18:08.895608+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T061808, start_date=20221110T061814, end_date=20221110T061817 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:18:08.895608+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:18:17.787969Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f0d9854f-2a8d-4c8e-9997-edea94fafcba"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..183fbd51 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:39:30.225803Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:39:29.484119Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "d5d27e25-e201-356d-a3bd-c43e8b14ac3e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "d5d27e25-e201-356d-a3bd-c43e8b14ac3e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9144b4a-f816-48c1-9cb9-ea812b582180"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T06:39:29.484119+00:00, map_index=-1, run_start_date=2022-11-10 06:39:30.225803+00:00, try_number=1, job_id=607, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:39:29.484119+00:00 +INFO - Started process 4301 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T06:39:29.484119+00:00', '--job-id', '607', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpt8d2pe_m'] +INFO - Job 607: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:39:29.484119+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:39:29.484119+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T063929, start_date=20221110T063930, end_date=20221110T063933 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T06:39:29.484119+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:39:33.700085Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d9144b4a-f816-48c1-9cb9-ea812b582180"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..d8a31ec3 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:39:40.042610Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:39:29.484119Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "d5d27e25-e201-356d-a3bd-c43e8b14ac3e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "d5d27e25-e201-356d-a3bd-c43e8b14ac3e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1395f783-732e-439e-802e-8bac86f343d7"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T06:39:29.484119+00:00, map_index=-1, run_start_date=2022-11-10 06:39:40.042610+00:00, try_number=1, job_id=609, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:39:29.484119+00:00 +INFO - Started process 4311 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T06:39:29.484119+00:00', '--job-id', '609', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp0g4i2gyj'] +INFO - Job 609: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:39:29.484119+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:39:29.484119+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc54276700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'VVGdcOYE/N0j8lB/9DkvHw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:VVGdcOYE/N0j8lB/9DkvHw== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T063940Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T063940Z +20221110/us-east-1/s3/aws4_request +92e3660b118e1efaaed7aaeb8ac6c7f5b8a7d35b46755dc996bc33cffad20fd7 +INFO - '2022-11-10' - botocore.auth - Signature: +1ae91ea0cce6926b8f70c08a224ba24cd6f397032107cdb6420e5bf2e0abe162 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': '7LUS8rgUuA9ibgeYNN5cJRVKV/L4y2wM7GqRfI4wVbI5/k0bUft9SOTHOfYMW0kk9F7Xk9njBsU=', 'x-amz-request-id': 'E4Z80DSKPD7GYBCC', 'Date': 'Thu, 10 Nov 2022 06:39:41 GMT', 'ETag': '"55519d70e604fcdd23f2507ff4392f1f"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T063929, start_date=20221110T063940, end_date=20221110T063942 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T06:39:29.484119+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:39:42.137035Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "1395f783-732e-439e-802e-8bac86f343d7"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..47c1b306 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T06\357\200\27239\357\200\27229.484119+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:39:35.040987Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:39:29.484119Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "d5d27e25-e201-356d-a3bd-c43e8b14ac3e"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "d5d27e25-e201-356d-a3bd-c43e8b14ac3e"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "21f6a891-4eb7-4ece-a135-216db7248253"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T06:39:29.484119+00:00, map_index=-1, run_start_date=2022-11-10 06:39:35.040987+00:00, try_number=1, job_id=608, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:39:29.484119+00:00 +INFO - Started process 4306 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-10T06:39:29.484119+00:00', '--job-id', '608', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpug2xvi80'] +INFO - Job 608: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:39:29.484119+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T06:39:29.484119+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T063929, start_date=20221110T063935, end_date=20221110T063939 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T06:39:29.484119+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:39:39.377240Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "21f6a891-4eb7-4ece-a135-216db7248253"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..fd3dd2a5 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:03:58.355393Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:03:56.245412Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e83bac2-0de8-4dd5-a591-c39ce4d61848"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T11:03:56.245412+00:00, map_index=-1, run_start_date=2022-11-10 11:03:58.355393+00:00, try_number=1, job_id=2984, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:03:56.245412+00:00 +INFO - Started process 2138 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T11:03:56.245412+00:00', '--job-id', '2984', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp6z3vk2iw'] +INFO - Job 2984: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:03:56.245412+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 52, in extract + conn = hook.get_conn() + File "/usr/local/lib/python3.9/site-packages/airflow/providers/postgres/hooks/postgres.py", line 115, in get_conn + self.conn = psycopg2.connect(**conn_args) + File "/usr/local/lib/python3.9/site-packages/psycopg2/__init__.py", line 122, in connect + conn = _connect(dsn, connection_factory=connection_factory, **kwasync) +psycopg2.OperationalError: could not translate host name "training-main.cghe7e6sfljt.us-east-1.rds.amazonaws.com" to address: Temporary failure in name resolution + +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T110356, start_date=20221110T110358, end_date=20221110T110409 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2984 for task TaskExtract (could not translate host name "training-main.cghe7e6sfljt.us-east-1.rds.amazonaws.com" to address: Temporary failure in name resolution +; 2138) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..f73c2fb2 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:14:10.784614Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:03:56.245412Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7fb9097e-2f92-41e3-8cfa-644a8d98b7e5"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T11:03:56.245412+00:00, map_index=-1, run_start_date=2022-11-10 11:14:10.784614+00:00, try_number=2, job_id=2990, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:03:56.245412+00:00 +INFO - Started process 2229 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T11:03:56.245412+00:00', '--job-id', '2990', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmppux72m8z'] +INFO - Job 2990: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:03:56.245412+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T110356, start_date=20221110T111410, end_date=20221110T111414 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:14:14.796007Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7fb9097e-2f92-41e3-8cfa-644a8d98b7e5"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..58fe88d9 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T11:14:25.237559Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:03:56.245412Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45fed7d3-d209-4856-8aa5-63a66da1bfa4"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T11:03:56.245412+00:00, map_index=-1, run_start_date=2022-11-10 11:14:25.237559+00:00, try_number=1, job_id=2993, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:03:56.245412+00:00 +INFO - Started process 2243 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T11:03:56.245412+00:00', '--job-id', '2993', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpz32n_n6n'] +INFO - Job 2993: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:03:56.245412+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228ee5e700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5tSMZQaqcrCzCddBSibreQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T110356, start_date=20221110T111425, end_date=20221110T111426 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2993 for task TaskLoad (Unable to locate credentials; 2243) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskLoad/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..ce901f34 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,125 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:24:33.778290Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:03:56.245412Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d65a6d98-3ad2-475d-ad39-a0b48e301992"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T11:03:56.245412+00:00, map_index=-1, run_start_date=2022-11-10 11:24:33.778290+00:00, try_number=2, job_id=3000, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:03:56.245412+00:00 +INFO - Started process 181 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T11:03:56.245412+00:00', '--job-id', '3000', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp32zuzplz'] +INFO - Job 3000: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:03:56.245412+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - alkemy-2022-broc +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event 
name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f64ee3f6e50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 
'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5tSMZQaqcrCzCddBSibreQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:5tSMZQaqcrCzCddBSibreQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T112438Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T112438Z +20221110/us-east-1/s3/aws4_request +7fd0f97f5183259ae1c4789c98a47319e4586f596a479e5d2074e0ba4ee611f3 +INFO - '2022-11-10' - botocore.auth - Signature: +c49be21cd99501659dd08f57d91088edb6059b0445c2121f6c7e4e86d2585a12 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'hPy6mNzfTeZ3FVB+RlpJsw/qnxiY0EW5u8Jxwp+cxGmlq1/IIEyq79aPElRRHEOJhLkJO7MXdBtW816AXKV8ZQ==', 'x-amz-request-id': '1SEFRKCHCN3DHC7Y', 'Date': 'Thu, 10 Nov 2022 11:24:39 GMT', 'ETag': '"e6d48c6506aa72b0b309d7414a26eb79"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T110356, start_date=20221110T112433, end_date=20221110T112440 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:24:40.807424Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "d65a6d98-3ad2-475d-ad39-a0b48e301992"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..bdfd595f --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27203\357\200\27256.245412+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:14:15.663334Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:03:56.245412Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "41c614bd-d7d6-379e-907a-636e84057a81"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c03a9db8-2ba2-4f69-9b1c-622c16e8b055"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T11:03:56.245412+00:00, map_index=-1, run_start_date=2022-11-10 11:14:15.663334+00:00, try_number=1, job_id=2992, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:03:56.245412+00:00 +INFO - Started process 2238 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-10T11:03:56.245412+00:00', '--job-id', '2992', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpo4r1qqe0'] +INFO - Job 2992: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:03:56.245412+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T110356, start_date=20221110T111415, end_date=20221110T111424 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T11:03:56.245412+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:14:24.105424Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "c03a9db8-2ba2-4f69-9b1c-622c16e8b055"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..daffbf46 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:09:52.892262Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:09:51.447390Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "860aaa39-de66-48a9-a71a-6817e87ffe16"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T11:09:51.447390+00:00, map_index=-1, run_start_date=2022-11-10 11:09:52.892262+00:00, try_number=1, job_id=2985, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:09:51.447390+00:00 +INFO - Started process 2177 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T11:09:51.447390+00:00', '--job-id', '2985', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpgt3_nlk0'] +INFO - Job 2985: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:09:51.447390+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T110951, start_date=20221110T110952, end_date=20221110T110957 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:09:57.279718Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "860aaa39-de66-48a9-a71a-6817e87ffe16"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..a0bc746d --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T11:10:06.132025Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:09:51.447390Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "0fe0090c-2021-4fd0-a15c-fe05da482fa3"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T11:09:51.447390+00:00, map_index=-1, run_start_date=2022-11-10 11:10:06.132025+00:00, try_number=1, job_id=2987, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:09:51.447390+00:00 +INFO - Started process 2187 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T11:09:51.447390+00:00', '--job-id', '2987', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpc7m3dtu7'] +INFO - Job 2987: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:09:51.447390+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228ee5f700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'wsFSCtxe3weEe96IU5LOZg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T110951, start_date=20221110T111006, end_date=20221110T111007 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2987 for task TaskLoad (Unable to locate credentials; 2187) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..6b7548c4 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,292 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:20:07.954078Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:09:51.447390Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "253f7f6f-c4fd-486f-9b14-92c03c088c8f"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T11:09:51.447390+00:00, map_index=-1, run_start_date=2022-11-10 11:20:07.954078+00:00, try_number=2, job_id=2995, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:09:51.447390+00:00 +INFO - Started process 2291 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T11:09:51.447390+00:00', '--job-id', '2995', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpeoqoy7l0'] +INFO - Job 2995: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:09:51.447390+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - dipa-s3 +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from 
before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File 
"/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + 
return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File 
"/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File 
"/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228eecfe50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 
+INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling 
handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5tSMZQaqcrCzCddBSibreQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style 
addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File 
"/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 110, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, 
Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T110951, start_date=20221110T112007, end_date=20221110T112009 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2995 for task TaskLoad (Unable to locate credentials; 2291) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=3.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=3.log" new file mode 100644 index 00000000..69093021 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskLoad/attempt=3.log" @@ -0,0 +1,125 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 3 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:30:10.047708Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:09:51.447390Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c579cb0-4f28-4a60-bcb2-bfce33b4992a"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T11:09:51.447390+00:00, map_index=-1, run_start_date=2022-11-10 11:30:10.047708+00:00, try_number=3, job_id=3167, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:09:51.447390+00:00 +INFO - Started process 1138 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T11:09:51.447390+00:00', '--job-id', '3167', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpoabhorfz'] +INFO - Job 3167: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:09:51.447390+00:00 +AIRFLOW_CTX_TRY_NUMBER=3 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - alkemy-2022-broc +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event 
name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f64ee3f6e50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 
'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T113010Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T113010Z +20221110/us-east-1/s3/aws4_request +0ecd5d34aeca1b8193bf12eed3ab328e79d510c1d22961daf20a43a1016ab586 +INFO - '2022-11-10' - botocore.auth - Signature: +9c82edc8481e253edf74ebde2104f3d749b38746c313dc14e485d8c1c55510b2 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': '/yhrMrPx2oD7w1eNoTbkm6mJY4IzmkkvcGCHSW9wSeMCsf986tY5nfOoEDMJKEqtVQ/tXqiIrUg=', 'x-amz-request-id': 'P7WFS190VG5XKJH4', 'Date': 'Thu, 10 Nov 2022 11:30:11 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T110951, start_date=20221110T113010, end_date=20221110T113012 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:30:12.739886Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9c579cb0-4f28-4a60-bcb2-bfce33b4992a"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..64b140ae --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27209\357\200\27251.447390+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:09:57.992861Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:09:51.447390Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "914c79e0-af6e-35df-8bc7-3b62d6fca2f9"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "504558b6-3f01-40da-ab71-a1a04b11516d"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T11:09:51.447390+00:00, map_index=-1, run_start_date=2022-11-10 11:09:57.992861+00:00, try_number=1, job_id=2986, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:09:51.447390+00:00 +INFO - Started process 2182 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-10T11:09:51.447390+00:00', '--job-id', '2986', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpi5__wre8'] +INFO - Job 2986: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:09:51.447390+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T110951, start_date=20221110T110957, end_date=20221110T111004 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T11:09:51.447390+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:10:04.273413Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "504558b6-3f01-40da-ab71-a1a04b11516d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..f6cf4939 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:26:40.402978Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:26:38.963926Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "fc43a5eb-c4b0-36ca-a822-c06a3c89fec3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "fc43a5eb-c4b0-36ca-a822-c06a3c89fec3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eb1c2eb4-d013-4ca3-9fa0-02ae46ecd5a2"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=manual__2022-11-10T11:26:38.963926+00:00, map_index=-1, run_start_date=2022-11-10 11:26:40.402978+00:00, try_number=1, job_id=3075, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:26:38.963926+00:00 +INFO - Started process 612 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'manual__2022-11-10T11:26:38.963926+00:00', '--job-id', '3075', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpfcleqgkm'] +INFO - Job 3075: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:26:38.963926+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:26:38.963926+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T112638, start_date=20221110T112640, end_date=20221110T112644 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=manual__2022-11-10T11:26:38.963926+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:26:44.725353Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "eb1c2eb4-d013-4ca3-9fa0-02ae46ecd5a2"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..07c445c8 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,125 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T11:27:04.880165Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:26:38.963926Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "fc43a5eb-c4b0-36ca-a822-c06a3c89fec3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "fc43a5eb-c4b0-36ca-a822-c06a3c89fec3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a937e4f-346f-4422-b2d8-c39f8c5c4092"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=manual__2022-11-10T11:26:38.963926+00:00, map_index=-1, run_start_date=2022-11-10 11:27:04.880165+00:00, try_number=1, job_id=3091, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:26:38.963926+00:00 +INFO - Started process 699 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'manual__2022-11-10T11:26:38.963926+00:00', '--job-id', '3091', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp63oxxdmi'] +INFO - Job 3091: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:26:38.963926+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:26:38.963926+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - alkemy-2022-broc +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event 
name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f64ee386700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 
'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'BhYhBcSul9hrq9lNzgieHQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:BhYhBcSul9hrq9lNzgieHQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T112706Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T112706Z +20221110/us-east-1/s3/aws4_request +418deea4b96e53309180d2bbadcc71eddc75a2172ec80495b8c193184185b909 +INFO - '2022-11-10' - botocore.auth - Signature: +25cfe58abc1a01561bd2a81cf8ed3871e5d1c6f634be8d102fdbe9d55714f79d +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'acf6jSgzg78wKhIrBYoYjwyhvztgxk4rjx14SL2GoekzqAKDfVApOMunAm0F+XBWZmJGqpWRvBw=', 'x-amz-request-id': 'KNZKZ48MSPV1VRAK', 'Date': 'Thu, 10 Nov 2022 11:27:06 GMT', 'ETag': '"06162105c4ae97d86babd94dce089e1d"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T112638, start_date=20221110T112704, end_date=20221110T112708 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=manual__2022-11-10T11:26:38.963926+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': 
True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:27:08.091046Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": 
"Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8a937e4f-346f-4422-b2d8-c39f8c5c4092"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..a33fe604 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=manual__2022-11-10T11\357\200\27226\357\200\27238.963926+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:26:46.356899Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": true}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T11:26:38.963926Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "fc43a5eb-c4b0-36ca-a822-c06a3c89fec3"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "fc43a5eb-c4b0-36ca-a822-c06a3c89fec3"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45f7fc04-52ec-4ab6-8e0d-232f246b8308"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=manual__2022-11-10T11:26:38.963926+00:00, map_index=-1, run_start_date=2022-11-10 11:26:46.356899+00:00, try_number=1, job_id=3079, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 11:26:38.963926+00:00 +INFO - Started process 631 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'manual__2022-11-10T11:26:38.963926+00:00', '--job-id', '3079', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmplioq3mg8'] +INFO - Job 3079: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T11:26:38.963926+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=manual__2022-11-10T11:26:38.963926+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T112638, start_date=20221110T112646, end_date=20221110T112703 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=manual__2022-11-10T11:26:38.963926+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 
'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:27:03.420039Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45f7fc04-52ec-4ab6-8e0d-232f246b8308"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27208\357\200\27234.199951+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27208\357\200\27234.199951+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..4fbb8c31 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27208\357\200\27234.199951+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,51 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:08:34.596737Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": 
"2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:08:34.199951Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "6563c736-0d06-3c74-ac9a-b03a6ba5f7b5"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "6563c736-0d06-3c74-ac9a-b03a6ba5f7b5"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, 
"executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "8f9e67c2-24b1-4bb5-a863-6007f8a68646"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T05:08:34.199951+00:00, map_index=-1, run_start_date=2022-11-10 06:08:34.596737+00:00, try_number=1, job_id=578, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:08:34.199951+00:00 +INFO - Started process 1105 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T05:08:34.199951+00:00', '--job-id', '578', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmphm5kza6o'] +INFO - Job 578: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:08:34.199951+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:08:34.199951+00:00 +INFO - Done. Returned value was: {{ task_instance.xcom_pull(task_ids='extract', dag_id='adhoc_airflow', key='return_value') }} +ERROR - Could not serialize the XCom value into JSON. If you are using pickle instead of JSON for XCom, then you need to enable pickle support for XCom in your airflow config. +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/taskinstance.py", line 2378, in xcom_push + XCom.set( + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 206, in set + value = cls.serialize_value( + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 597, in serialize_value + return json.dumps(value).encode('UTF-8') + File "/usr/local/lib/python3.9/json/__init__.py", line 231, in dumps + return _default_encoder.encode(obj) + File "/usr/local/lib/python3.9/json/encoder.py", line 199, in encode + chunks = self.iterencode(o, _one_shot=True) + File "/usr/local/lib/python3.9/json/encoder.py", line 257, in iterencode + return _iterencode(o, 0) + File "/usr/local/lib/python3.9/json/encoder.py", line 179, in default + raise TypeError(f'Object of type {o.__class__.__name__} ' +TypeError: Object of type PlainXComArg is not JSON serializable +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T050834, start_date=20221110T060834, end_date=20221110T060835 +ERROR - Failed to execute job 578 for task TaskExtract (Object of type PlainXComArg is not JSON serializable; 1105) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..aea8dbd8 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,51 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:13:21.036300Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "_TaskDecorator(function=, operator_class=, multiple_outputs=False, kwargs={'task_id': 'extract'})", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": 
"2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, 
"executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": {"decorator_name": "task", "function": "<>", "kwargs": {"task_id": "extract"}, "multiple_outputs": false, "operator_class": "<>"}, "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "345dd6a5-93ab-45cd-a0b2-846f1de04626"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T05:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 06:13:21.036300+00:00, try_number=1, job_id=582, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:12:53.294512+00:00 +INFO - Started process 1616 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T05:12:53.294512+00:00', '--job-id', '582', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpj1krvcy5'] +INFO - Job 582: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - Done. Returned value was: {{ task_instance.xcom_pull(task_ids='extract', dag_id='adhoc_airflow', key='return_value') }} +ERROR - Could not serialize the XCom value into JSON. If you are using pickle instead of JSON for XCom, then you need to enable pickle support for XCom in your airflow config. +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/taskinstance.py", line 2378, in xcom_push + XCom.set( + File "/usr/local/lib/python3.9/site-packages/airflow/utils/session.py", line 72, in wrapper + return func(*args, **kwargs) + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 206, in set + value = cls.serialize_value( + File "/usr/local/lib/python3.9/site-packages/airflow/models/xcom.py", line 597, in serialize_value + return json.dumps(value).encode('UTF-8') + File "/usr/local/lib/python3.9/json/__init__.py", line 231, in dumps + return _default_encoder.encode(obj) + File "/usr/local/lib/python3.9/json/encoder.py", line 199, in encode + chunks = self.iterencode(o, _one_shot=True) + File "/usr/local/lib/python3.9/json/encoder.py", line 257, in iterencode + return _iterencode(o, 0) + File "/usr/local/lib/python3.9/json/encoder.py", line 179, in default + raise TypeError(f'Object of type {o.__class__.__name__} ' +TypeError: Object of type PlainXComArg is not JSON serializable +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T051253, start_date=20221110T061321, end_date=20221110T061321 +ERROR - Failed to execute job 582 for task TaskExtract (Object of type PlainXComArg is not JSON serializable; 1616) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..916ce42b --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:23:23.233629Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9803c961-679f-4490-9742-7a4738ba816d"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T05:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 06:23:23.233629+00:00, try_number=2, job_id=598, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:12:53.294512+00:00 +INFO - Started process 2652 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T05:12:53.294512+00:00', '--job-id', '598', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp34_5wd9k'] +INFO - Job 598: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T051253, start_date=20221110T062323, end_date=20221110T062326 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:23:26.513894Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9803c961-679f-4490-9742-7a4738ba816d"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..e92af518 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T06:23:32.685070Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "82d0e649-2ec5-4721-b1c3-ea2620836804"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T05:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 06:23:32.685070+00:00, try_number=1, job_id=603, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:12:53.294512+00:00 +INFO - Started process 2704 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T05:12:53.294512+00:00', '--job-id', '603', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp4hm321q4'] +INFO - Job 603: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc542868b0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'N6V18ZBB5L+/Ym0KCsbx3Q==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:N6V18ZBB5L+/Ym0KCsbx3Q== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T062333Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T062333Z +20221110/us-east-1/s3/aws4_request +130acf3f59fac28373d69bfa2811504c066d623a071fe74a8012263f2dd99480 +INFO - '2022-11-10' - botocore.auth - Signature: +abaafc16c78f783b9a0049bf42590791869b2b256b5982936712fea935d75621 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'pzf/hyK+x0oi8/YWX3pgQsj030/bB0+/kzp1DqgcI+RuW0gOXgJ4cVg3M4ybAeyN+hl30emHlGA=', 'x-amz-request-id': 'XFKHNNDASZHH3BRE', 'Date': 'Thu, 10 Nov 2022 06:23:33 GMT', 'ETag': '"37a575f19041e4bfbf626d0a0ac6f1dd"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T051253, start_date=20221110T062332, end_date=20221110T062334 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 
'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:23:34.951641Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, 
"outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "82d0e649-2ec5-4721-b1c3-ea2620836804"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..dae7b426 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T05\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T06:23:27.608004Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T05:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "e9155918-c697-3e6b-9412-e58a42a96dee"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d62849f-fa8a-4469-8755-0e16228be393"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T05:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 06:23:27.608004+00:00, try_number=1, job_id=601, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 05:12:53.294512+00:00 +INFO - Started process 2679 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T05:12:53.294512+00:00', '--job-id', '601', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp_68fgaab'] +INFO - Job 601: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T05:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T051253, start_date=20221110T062327, end_date=20221110T062332 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T05:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': 
, 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T06:23:32.025991Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9d62849f-fa8a-4469-8755-0e16228be393"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..3dcbd95a --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T07:12:54.231062Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "27698066-7e10-3a45-8186-703ff81de1af"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "27698066-7e10-3a45-8186-703ff81de1af"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db10499d-8d4a-4e96-a578-a2fc1c41f608"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T06:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 07:12:54.231062+00:00, try_number=1, job_id=613, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:12:53.294512+00:00 +INFO - Started process 7600 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T06:12:53.294512+00:00', '--job-id', '613', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmplfpm71bn'] +INFO - Job 613: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T06:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T061253, start_date=20221110T071254, end_date=20221110T071257 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T06:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T07:12:57.327574Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "db10499d-8d4a-4e96-a578-a2fc1c41f608"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..dd74c609 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,124 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T07:13:03.884357Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "27698066-7e10-3a45-8186-703ff81de1af"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "27698066-7e10-3a45-8186-703ff81de1af"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b0c039b3-c5d6-4b93-920f-879ade43c4c6"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T06:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 07:13:03.884357+00:00, try_number=1, job_id=615, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:12:53.294512+00:00 +INFO - Started process 7610 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T06:12:53.294512+00:00', '--job-id', '615', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp6wa49_c4'] +INFO - Job 615: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T06:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7fcc54278700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) 
to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'MfpOpeVk3IfVi6Cjxovvbg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:MfpOpeVk3IfVi6Cjxovvbg== +host:dipa-s3.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T071304Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T071304Z +20221110/us-east-1/s3/aws4_request +6519476e48511acae5daa25c4912abb292cdeeda05f02e8758dcc6007263ea63 +INFO - '2022-11-10' - botocore.auth - Signature: +b09096267cb73656e3847441736582ab2a43274f8d6249abdc1faa4ba1c83df2 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): dipa-s3.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://dipa-s3.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'FISKpGNU92eshgjntX+hJUxZ0OsqiNHo+U2+h7lBemhSe3BYfZ3YGnCOFEbl88gkXHQ+yMmHUjU=', 'x-amz-request-id': '0W4VPFRB7NAHQHW8', 'Date': 'Thu, 10 Nov 2022 07:13:04 GMT', 'ETag': '"31fa4ea5e564dc87d58ba0a3c68bef6e"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T061253, start_date=20221110T071303, end_date=20221110T071305 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T06:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 
'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T07:13:05.840212Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, 
"outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "b0c039b3-c5d6-4b93-920f-879ade43c4c6"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..d454bdda --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T06\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T07:12:58.963527Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T06:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "27698066-7e10-3a45-8186-703ff81de1af"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "27698066-7e10-3a45-8186-703ff81de1af"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb84745f-70ed-4d8c-a0da-64737ec27ffc"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T06:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 07:12:58.963527+00:00, try_number=1, job_id=614, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 06:12:53.294512+00:00 +INFO - Started process 7605 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T06:12:53.294512+00:00', '--job-id', '614', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpcl3zcgel'] +INFO - Job 614: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 1fc2f66b12c6 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T06:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T06:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T061253, start_date=20221110T071258, end_date=20221110T071303 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T06:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': 
, 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T07:13:03.185614Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "bb84745f-70ed-4d8c-a0da-64737ec27ffc"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..ffb3544a --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T08:12:54.535306Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9645daa7-9473-4cf8-bec4-baf37e36ec9e"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 08:12:54.535306+00:00, try_number=1, job_id=621, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 2660 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '621', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpqbzf9pve'] +INFO - Job 621: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T071253, start_date=20221110T081254, end_date=20221110T081258 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T08:12:58.733504Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "9645daa7-9473-4cf8-bec4-baf37e36ec9e"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..6ee4be1b --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T08:13:04.531377Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "5a488605-ff78-46f2-bfb8-4c0d085f6796"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 08:13:04.531377+00:00, try_number=1, job_id=623, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 2675 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '623', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpszc2ptv6'] +INFO - Job 623: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228ee62700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'cQCLlvXu2mBXUimE4Yw1Vg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T071253, start_date=20221110T081304, end_date=20221110T081305 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 623 for task TaskLoad (Unable to locate credentials; 2675) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..f95a038e --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T08:23:06.628755Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f106da8e-d1c3-4e3e-b6ad-f603375cafcc"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 08:23:06.628755+00:00, try_number=2, job_id=625, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 4192 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '625', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmprno2ta9n'] +INFO - Job 625: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228eed2e50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'cQCLlvXu2mBXUimE4Yw1Vg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T071253, start_date=20221110T082306, end_date=20221110T082307 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 625 for task TaskLoad (Unable to locate credentials; 4192) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=3.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=3.log" new file mode 100644 index 00000000..09b81cd9 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=3.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 3 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:03:53.766326Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "fbc18d58-5b9e-4d8e-bc29-3518aa95ce34"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 11:03:53.766326+00:00, try_number=3, job_id=2983, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 2130 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '2983', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpx5rv4mzl'] +INFO - Job 2983: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=3 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228eeb14c0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'cQCLlvXu2mBXUimE4Yw1Vg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T071253, start_date=20221110T110353, end_date=20221110T110355 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2983 for task TaskLoad (Unable to locate credentials; 2130) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=4.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=4.log" new file mode 100644 index 00000000..6d76831f --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=4.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 4 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:13:56.657454Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "45315931-75bc-4a1d-9a9c-bbe7ba1715a9"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 11:13:56.657454+00:00, try_number=4, job_id=2988, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 2213 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '2988', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpmp1wg11x'] +INFO - Job 2988: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=4 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228eeb24c0> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'wsFSCtxe3weEe96IU5LOZg==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T071253, start_date=20221110T111356, end_date=20221110T111357 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2988 for task TaskLoad (Unable to locate credentials; 2213) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=5.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=5.log" new file mode 100644 index 00000000..02f90134 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskLoad/attempt=5.log" @@ -0,0 +1,169 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 5 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:24:33.751210Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3d8fbaf1-1088-4fb2-8ae6-fe052f652691"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 11:24:33.751210+00:00, try_number=5, job_id=2998, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 182 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '2998', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpbgjcpkq_'] +INFO - Job 2998: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=5 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - alkemy-2022-broc +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing 
event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f64ee3f8e50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, 
{'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5tSMZQaqcrCzCddBSibreQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:5tSMZQaqcrCzCddBSibreQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T112438Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T112438Z +20221110/us-east-1/s3/aws4_request +7fd0f97f5183259ae1c4789c98a47319e4586f596a479e5d2074e0ba4ee611f3 +INFO - '2022-11-10' - botocore.auth - Signature: +c49be21cd99501659dd08f57d91088edb6059b0445c2121f6c7e4e86d2585a12 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. 
+INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 503 None +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-request-id': '1SEF3FBP2K8MZDM2', 'x-amz-id-2': 'ebV0KlyhWJvLhy1TxoXuDJlqOItg9unNjP6sXIs6r07NPBk/oXzESoi2x+n0UP8yS0CRX9A7fV8vrYuEQnTKsw==', 'Content-Type': 'application/xml', 'Transfer-Encoding': 'chunked', 'Date': 'Thu, 10 Nov 2022 11:24:39 GMT', 'Server': 'AmazonS3', 'Connection': 'close'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'\nSlowDownPlease reduce your request rate.1SEF3FBP2K8MZDM2ebV0KlyhWJvLhy1TxoXuDJlqOItg9unNjP6sXIs6r07NPBk/oXzESoi2x+n0UP8yS0CRX9A7fV8vrYuEQnTKsw==' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - retry needed: retryable HTTP status code received: 503 +INFO - '2022-11-10' - botocore.retryhandler - Retry needed, action of: 0.23958077900129016 +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.endpoint - Response received to retry, sleeping for 0.23958077900129016 seconds +INFO - '2022-11-10' - botocore.awsrequest - Rewinding stream: +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI 
updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. +INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:5tSMZQaqcrCzCddBSibreQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T112441Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T112441Z +20221110/us-east-1/s3/aws4_request +071328219f3ec2b1fbda6c701cc264c481ae9c576826860447914abaafca9f4e +INFO - '2022-11-10' - botocore.auth - Signature: +761f7fece7e6f47f955a3494d5a68a3868711e1b071d97363c1b2e8e8963317b +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Resetting dropped connection: alkemy-2022-broc.s3.amazonaws.com +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. 
+INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': '5HZD7H77KntQK5LbycmWzwc9e4O5SMd2iofBxms9j2bYkgoedfSiy2CaSqlJadsoMrbzax1s7C488zpIPvwY2g==', 'x-amz-request-id': 'JRJPB56KD1WDNTRT', 'Date': 'Thu, 10 Nov 2022 11:24:41 GMT', 'ETag': '"e6d48c6506aa72b0b309d7414a26eb79"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T071253, start_date=20221110T112433, end_date=20221110T112442 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', 
properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:24:42.365885Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": 
"https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "3d8fbaf1-1088-4fb2-8ae6-fe052f652691"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..414a9ea5 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T07\357\200\27212\357\200\27253.294512+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for 
+INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T08:12:59.879430Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", 
"queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T07:12:53.294512Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "52cc4219-6c84-325f-bc49-6c6549866965"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": 
true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aeaa94c3-a92b-460f-b4f3-7e91678ae35f"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T07:12:53.294512+00:00, map_index=-1, run_start_date=2022-11-10 08:12:59.879430+00:00, try_number=1, job_id=622, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 07:12:53.294512+00:00 +INFO - Started process 2670 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T07:12:53.294512+00:00', '--job-id', '622', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp06jjx38e'] +INFO - Job 622: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T07:12:53.294512+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T071253, start_date=20221110T081259, end_date=20221110T081303 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T07:12:53.294512+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 
'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T08:13:03.516073Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", 
"retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "aeaa94c3-a92b-460f-b4f3-7e91678ae35f"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..e7810296 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:03:53.803601Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T09:39:45.202232Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "942176e1-5790-4e20-8e46-43835595a90c"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T09:39:45.202232+00:00, map_index=-1, run_start_date=2022-11-10 11:03:53.803601+00:00, try_number=1, job_id=2982, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 09:39:45.202232+00:00 +INFO - Started process 2132 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T09:39:45.202232+00:00', '--job-id', '2982', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpdqbyjudh'] +INFO - Job 2982: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T09:39:45.202232+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 52, in extract + conn = hook.get_conn() + File "/usr/local/lib/python3.9/site-packages/airflow/providers/postgres/hooks/postgres.py", line 115, in get_conn + self.conn = psycopg2.connect(**conn_args) + File "/usr/local/lib/python3.9/site-packages/psycopg2/__init__.py", line 122, in connect + conn = _connect(dsn, connection_factory=connection_factory, **kwasync) +psycopg2.OperationalError: could not translate host name "training-main.cghe7e6sfljt.us-east-1.rds.amazonaws.com" to address: Temporary failure in name resolution + +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T093945, start_date=20221110T110353, end_date=20221110T110405 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2982 for task TaskExtract (could not translate host name "training-main.cghe7e6sfljt.us-east-1.rds.amazonaws.com" to address: Temporary failure in name resolution +; 2132) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskExtract/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskExtract/attempt=2.log" new file mode 100644 index 00000000..982c9875 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskExtract/attempt=2.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:14:06.533999Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T09:39:45.202232Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f0a79440-f207-45d0-874c-5ed3d3dd51c1"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T09:39:45.202232+00:00, map_index=-1, run_start_date=2022-11-10 11:14:06.533999+00:00, try_number=2, job_id=2989, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 09:39:45.202232+00:00 +INFO - Started process 2224 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T09:39:45.202232+00:00', '--job-id', '2989', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpts5blp6i'] +INFO - Job 2989: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T09:39:45.202232+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T093945, start_date=20221110T111406, end_date=20221110T111410 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:14:10.897767Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "f0a79440-f207-45d0-874c-5ed3d3dd51c1"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..d80f1895 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,291 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T11:14:27.938372Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T09:39:45.202232Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "efeb83a4-aca7-4ba3-a9e8-b18d5ff9a0b3"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T09:39:45.202232+00:00, map_index=-1, run_start_date=2022-11-10 11:14:27.938372+00:00, try_number=1, job_id=2994, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 09:39:45.202232+00:00 +INFO - Started process 2250 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T09:39:45.202232+00:00', '--job-id', '2994', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpnezym675'] +INFO - Job 2994: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T09:39:45.202232+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.cloudsearchdomain.Search to 
before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.utils - IMDS ENDPOINT: http://169.254.169.254/ +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: env +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: assume-role-with-web-identity +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: sso +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: shared-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: custom-process +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: config-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: ec2-credentials-file +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: boto-config +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: container-role +INFO - '2022-11-10' - botocore.credentials - Looking for credentials via: iam-role +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (1): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/api/token: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in 
create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 
980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( +urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 454, in _fetch_metadata_token + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/api/token" +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTP connection (2): 169.254.169.254:80 +INFO - '2022-11-10' - botocore.utils - Caught retryable HTTP exception while making metadata service request to http://169.254.169.254/latest/meta-data/iam/security-credentials/: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 174, in _new_conn + conn = connection.create_connection( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 95, in create_connection + raise err + File "/usr/local/lib/python3.9/site-packages/urllib3/util/connection.py", line 85, in create_connection + sock.connect(sa) +ConnectionRefusedError: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 448, in send + 
urllib_response = conn.urlopen( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 787, in urlopen + retries = retries.increment( + File "/usr/local/lib/python3.9/site-packages/urllib3/util/retry.py", line 525, in increment + raise six.reraise(type(error), error, _stacktrace) + File "/usr/local/lib/python3.9/site-packages/urllib3/packages/six.py", line 770, in reraise + raise value + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 703, in urlopen + httplib_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/urllib3/connectionpool.py", line 398, in _make_request + conn.request(method, url, **httplib_request_kw) + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 239, in request + super(HTTPConnection, self).request(method, url, body=body, headers=headers) + File "/usr/local/lib/python3.9/http/client.py", line 1285, in request + self._send_request(method, url, body, headers, encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 94, in _send_request + rval = super()._send_request( + File "/usr/local/lib/python3.9/http/client.py", line 1331, in _send_request + self.endheaders(body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/http/client.py", line 1280, in endheaders + self._send_output(message_body, encode_chunked=encode_chunked) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 123, in _send_output + self.send(msg) + File "/usr/local/lib/python3.9/site-packages/botocore/awsrequest.py", line 218, in send + return super().send(str) + File "/usr/local/lib/python3.9/http/client.py", line 980, in send + self.connect() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 205, in connect + conn = self._new_conn() + File "/usr/local/lib/python3.9/site-packages/urllib3/connection.py", line 186, in _new_conn + raise NewConnectionError( 
+urllib3.exceptions.NewConnectionError: : Failed to establish a new connection: [Errno 111] Connection refused + +During handling of the above exception, another exception occurred: + +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/botocore/utils.py", line 507, in _get_request + response = self._session.send(request.prepare()) + File "/usr/local/lib/python3.9/site-packages/botocore/httpsession.py", line 477, in send + raise EndpointConnectionError(endpoint_url=request.url, error=e) +botocore.exceptions.EndpointConnectionError: Could not connect to the endpoint URL: "http://169.254.169.254/latest/meta-data/iam/security-credentials/" +INFO - '2022-11-10' - botocore.utils - Max number of attempts exceeded (1) when attempting to retrieve data from metadata service. +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f228ee5e820> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - 
UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'dipa-s3', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: 
calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/dipa-s3/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5tSMZQaqcrCzCddBSibreQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'dipa-s3'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. 
+INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/dipa-s3/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://dipa-s3.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - s3transfer.tasks - Exception raised. +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 
239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +ERROR - Task failed with exception +Traceback (most recent call last): + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 175, in execute + return_value = self.execute_callable() + File "/usr/local/lib/python3.9/site-packages/airflow/operators/python.py", line 193, in execute_callable + return self.python_callable(*self.op_args, **self.op_kwargs) + File "/usr/local/airflow/dags/GBUNSalvador_dag_elt.py", line 109, in load + response = s3_client.upload_file(file_name, bucket, object_name) + File "/usr/local/lib/python3.9/site-packages/boto3/s3/inject.py", line 143, in upload_file + return transfer.upload_file( + File "/usr/local/lib/python3.9/site-packages/boto3/s3/transfer.py", line 288, in upload_file + future.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 103, in result + return self._coordinator.result() + File "/usr/local/lib/python3.9/site-packages/s3transfer/futures.py", line 266, in result + raise self._exception + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 139, in __call__ + return self._execute_main(kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/tasks.py", line 162, in _execute_main + return_value = self._main(**kwargs) + File "/usr/local/lib/python3.9/site-packages/s3transfer/upload.py", line 758, in _main + client.put_object(Bucket=bucket, Key=key, Body=body, **extra_args) + File 
"/usr/local/lib/python3.9/site-packages/botocore/client.py", line 508, in _api_call + return self._make_api_call(operation_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 898, in _make_api_call + http, parsed_response = self._make_request( + File "/usr/local/lib/python3.9/site-packages/botocore/client.py", line 921, in _make_request + return self._endpoint.make_request(operation_model, request_dict) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 119, in make_request + return self._send_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 198, in _send_request + request = self.create_request(request_dict, operation_model) + File "/usr/local/lib/python3.9/site-packages/botocore/endpoint.py", line 134, in create_request + self._event_emitter.emit( + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 412, in emit + return self._emitter.emit(aliased_event_name, **kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 256, in emit + return self._emit(event_name, kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/hooks.py", line 239, in _emit + response = handler(**kwargs) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 103, in handler + return self.sign(operation_name, request) + File "/usr/local/lib/python3.9/site-packages/botocore/signers.py", line 187, in sign + auth.add_auth(request) + File "/usr/local/lib/python3.9/site-packages/botocore/auth.py", line 407, in add_auth + raise NoCredentialsError() +botocore.exceptions.NoCredentialsError: Unable to locate credentials +INFO - Marking task as UP_FOR_RETRY. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T093945, start_date=20221110T111427, end_date=20221110T111429 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +ERROR - Failed to execute job 2994 for task TaskLoad (Unable to locate credentials; 2250) +INFO - Task exited with return code 1 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskLoad/attempt=2.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskLoad/attempt=2.log" new file mode 100644 index 00000000..77550aa9 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskLoad/attempt=2.log" @@ -0,0 +1,125 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 2 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:24:33.780299Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": 
{"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T09:39:45.202232Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, 
"show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ba21a020-fc65-4fb8-841c-89df8ad86490"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T09:39:45.202232+00:00, map_index=-1, run_start_date=2022-11-10 11:24:33.780299+00:00, try_number=2, job_id=2999, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 09:39:45.202232+00:00 +INFO - Started process 183 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T09:39:45.202232+00:00', '--job-id', '2999', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpuhu1brsd'] +INFO - Job 2999: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T09:39:45.202232+00:00 +AIRFLOW_CTX_TRY_NUMBER=2 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - alkemy-2022-broc +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing 
event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f64ee3f8e50> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, 
{'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': '5tSMZQaqcrCzCddBSibreQ==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:5tSMZQaqcrCzCddBSibreQ== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T112438Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T112438Z +20221110/us-east-1/s3/aws4_request +7fd0f97f5183259ae1c4789c98a47319e4586f596a479e5d2074e0ba4ee611f3 +INFO - '2022-11-10' - botocore.auth - Signature: +c49be21cd99501659dd08f57d91088edb6059b0445c2121f6c7e4e86d2585a12 +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': '65/2BwbP0jZM9snkh2RitsVasQQgMW1+rKCaCKJsQft80q2rKIUeP4ZXPB3uW/D6zy9PIbwEzEsfo4LSqlJdhw==', 'x-amz-request-id': '1SE40TJTC1GAV2YX', 'Date': 'Thu, 10 Nov 2022 11:24:39 GMT', 'ETag': '"e6d48c6506aa72b0b309d7414a26eb79"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T093945, start_date=20221110T112433, end_date=20221110T112440 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 
'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:24:40.770687Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, 
"outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "ba21a020-fc65-4fb8-841c-89df8ad86490"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..0ce62a01 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T09\357\200\27239\357\200\27245.202232+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:14:12.576656Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T09:39:45.202232Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "64e3cc4e-86f3-343c-b670-b191ad6cdf79"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39bdae3d-1dce-4fca-ada0-c765eb9dcc05"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T09:39:45.202232+00:00, map_index=-1, run_start_date=2022-11-10 11:14:12.576656+00:00, try_number=1, job_id=2991, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 09:39:45.202232+00:00 +INFO - Started process 2233 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T09:39:45.202232+00:00', '--job-id', '2991', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpsvlz3q1v'] +INFO - Job 2991: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host d1b6a3478c83 +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T09:39:45.202232+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T093945, start_date=20221110T111412, end_date=20221110T111425 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T09:39:45.202232+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': 
, 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:14:25.983106Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "39bdae3d-1dce-4fca-ada0-c765eb9dcc05"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskExtract/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskExtract/attempt=1.log" new file mode 100644 index 00000000..cb417073 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskExtract/attempt=1.log" @@ -0,0 +1,48 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:24:45.363789Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskTransform'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": "set()", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T10:24:42.819313Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "0270ed4d-d8a2-3d89-b3e2-80bb94100b3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "0270ed4d-d8a2-3d89-b3e2-80bb94100b3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e4ff1a19-f3c0-46b3-9ff6-12b001ed3ae3"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, dagrun_id=scheduled__2022-11-10T10:24:42.819313+00:00, map_index=-1, run_start_date=2022-11-10 11:24:45.363789+00:00, try_number=1, job_id=3006, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 10:24:42.819313+00:00 +INFO - Started process 222 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskExtract', 'scheduled__2022-11-10T10:24:42.819313+00:00', '--job-id', '3006', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmp3rmn2mdx'] +INFO - Job 3006: Subtask TaskExtract +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskExtract +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T10:24:42.819313+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T10:24:42.819313+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Extract +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: alkemy_db +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. +INFO - '2022-11-10' - airflow.hooks.base - Using connection ID 'alkemy_db' for task execution. 
+WARNING - /usr/local/lib/python3.9/site-packages/airflow/providers/common/sql/hooks/sql.py:176 UserWarning: pandas only supports SQLAlchemy connectable (engine/connection) or database string URI or sqlite3 DBAPI2 connection. Other DBAPI2 objects are not tested. Please consider using SQLAlchemy. +INFO - '2022-11-10' - GBUNSalvador_dag_elt - universidad ... email +0 UNIVERSIDAD_DEL_SALVADOR ... ANTHONY88@GMAIL.COM +1 UNIVERSIDAD_DEL_SALVADOR ... TODD44@HOTMAIL.COM +2 UNIVERSIDAD_DEL_SALVADOR ... ZCANTRELL@YAHOO.COM +3 UNIVERSIDAD_DEL_SALVADOR ... HEATHER60@GMAIL.COM +4 UNIVERSIDAD_DEL_SALVADOR ... BWARNER@GMAIL.COM + +[5 rows x 8 columns] +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskExtract, execution_date=20221110T102442, start_date=20221110T112445, end_date=20221110T112450 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskExtract airflow_run_id=scheduled__2022-11-10T10:24:42.819313+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskExtract: TaskMetadata(name='GBUNSalvador_dag_elt.TaskExtract', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskExtract', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 
'TaskExtract', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': set(), 'downstream_task_ids': {'TaskTransform'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:24:50.743902Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskExtract", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": 
"PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskExtract"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskExtract", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "e4ff1a19-f3c0-46b3-9ff6-12b001ed3ae3"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskLoad/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskLoad/attempt=1.log" new file mode 100644 index 00000000..56ae94ab --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskLoad/attempt=1.log" @@ -0,0 +1,125 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find 
openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. +INFO - {"eventTime": "2022-11-10T11:25:13.994708Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "set()", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskLoad", "trigger_rule": "all_success", 
"upstream_task_ids": "{'TaskTransform'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, "nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T10:24:42.819313Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "0270ed4d-d8a2-3d89-b3e2-80bb94100b3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "0270ed4d-d8a2-3d89-b3e2-80bb94100b3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, 
"python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a58d7a98-0eed-4545-9bee-cae7b8f88d22"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, dagrun_id=scheduled__2022-11-10T10:24:42.819313+00:00, map_index=-1, run_start_date=2022-11-10 11:25:13.994708+00:00, try_number=1, job_id=3021, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 10:24:42.819313+00:00 +INFO - Started process 306 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskLoad', 'scheduled__2022-11-10T10:24:42.819313+00:00', '--job-id', '3021', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpuw61vg1k'] +INFO - Job 3021: Subtask TaskLoad +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. 
+INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskLoad +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T10:24:42.819313+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T10:24:42.819313+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Load: GBUNSalvador_dag_elt +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Connect: aws_s3_bucket +INFO - '2022-11-10' - GBUNSalvador_dag_elt - alkemy-2022-broc +INFO - '2022-11-10' - botocore.hooks - Changing event name from creating-client-class.iot-data to creating-client-class.iot-data-plane +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-call.apigateway to before-call.api-gateway +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.machinelearning.Predict to request-created.machine-learning.Predict +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.autoscaling.CreateLaunchConfiguration to before-parameter-build.auto-scaling.CreateLaunchConfiguration +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.route53 to before-parameter-build.route-53 +INFO - '2022-11-10' - botocore.hooks - Changing event name from request-created.cloudsearchdomain.Search to request-created.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.autoscaling.CreateLaunchConfiguration.complete-section to docs.*.auto-scaling.CreateLaunchConfiguration.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing event name from before-parameter-build.logs.CreateExportTask to before-parameter-build.cloudwatch-logs.CreateExportTask +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.logs.CreateExportTask.complete-section to docs.*.cloudwatch-logs.CreateExportTask.complete-section +INFO - '2022-11-10' - botocore.hooks - Changing 
event name from before-parameter-build.cloudsearchdomain.Search to before-parameter-build.cloudsearch-domain.Search +INFO - '2022-11-10' - botocore.hooks - Changing event name from docs.*.cloudsearchdomain.Search.complete-section to docs.*.cloudsearch-domain.Search.complete-section +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/endpoints.json +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/sdk-default-configuration.json +INFO - '2022-11-10' - botocore.hooks - Event choose-service-name: calling handler +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/s3/2006-03-01/service-2.json +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler ._handler at 0x7f64ee386700> +INFO - '2022-11-10' - botocore.hooks - Event creating-client-class.s3: calling handler +INFO - '2022-11-10' - botocore.endpoint - Setting s3 timeout as (60, 60) +INFO - '2022-11-10' - botocore.loaders - Loading JSON file: /usr/local/lib/python3.9/site-packages/botocore/data/_retry.json +INFO - '2022-11-10' - botocore.client - Registering retry handlers for service: s3 +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.tasks - UploadSubmissionTask(transfer_id=0, {'transfer_future': }) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task UploadSubmissionTask(transfer_id=0, {'transfer_future': }) with kwargs {'client': , 'config': , 'osutil': , 'request_executor': , 'transfer_future': } +INFO - '2022-11-10' - s3transfer.futures - Submitting task PutObjectTask(transfer_id=0, 
{'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) to executor for transfer request: 0. +INFO - '2022-11-10' - s3transfer.utils - Acquiring 0 +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) about to wait for the following futures [] +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - '2022-11-10' - s3transfer.tasks - PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) done waiting for dependent futures +INFO - '2022-11-10' - s3transfer.tasks - Executing task PutObjectTask(transfer_id=0, {'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}}) with kwargs {'client': , 'fileobj': , 'bucket': 'alkemy-2022-broc', 'key': 'GBUNSalvador_process.txt', 'extra_args': {}} +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-parameter-build.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.handlers - Adding expect 100 continue header to request. 
+INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-call.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Making request for OperationModel(name=PutObject) with params: {'url_path': '/alkemy-2022-broc/GBUNSalvador_process.txt', 'query_string': {}, 'method': 'PUT', 'headers': {'User-Agent': 'Boto3/1.24.59 Python/3.9.15 Linux/5.10.16.3-microsoft-standard-WSL2 Botocore/1.27.59', 'Content-MD5': 'kq5MtnEqxJhWjXmD2D7Hmw==', 'Expect': '100-continue'}, 'body': , 'url': 'https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt', 'context': {'client_region': 'us-east-1', 'client_config': , 'has_streaming_input': True, 'auth_type': None, 'signing': {'bucket': 'alkemy-2022-broc'}}} +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.hooks - Event choose-signer.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event before-sign.s3.PutObject: calling handler > +INFO - '2022-11-10' - botocore.utils - Defaulting to S3 virtual host style addressing with path style addressing fallback. +INFO - '2022-11-10' - botocore.utils - Checking for DNS compatible bucket for: https://s3.amazonaws.com/alkemy-2022-broc/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.utils - URI updated to: https://alkemy-2022-broc.s3.amazonaws.com/GBUNSalvador_process.txt +INFO - '2022-11-10' - botocore.auth - Calculating signature using v4 auth. 
+INFO - '2022-11-10' - botocore.auth - CanonicalRequest: +PUT +/GBUNSalvador_process.txt + +content-md5:kq5MtnEqxJhWjXmD2D7Hmw== +host:alkemy-2022-broc.s3.amazonaws.com +x-amz-content-sha256:UNSIGNED-PAYLOAD +x-amz-date:20221110T112516Z + +content-md5;host;x-amz-content-sha256;x-amz-date +UNSIGNED-PAYLOAD +INFO - '2022-11-10' - botocore.auth - StringToSign: +AWS4-HMAC-SHA256 +20221110T112516Z +20221110/us-east-1/s3/aws4_request +aa94391d07177fc67dbbae1cebe6a59d534e448197f8b558f83caebb7d0495d0 +INFO - '2022-11-10' - botocore.auth - Signature: +7d355fdfa8b4190c90d631c592f8b914ba635fd15fbb212b2214e12c12baeb3d +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.hooks - Event request-created.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.endpoint - Sending http request: +INFO - '2022-11-10' - botocore.httpsession - Certificate path: /usr/local/lib/python3.9/site-packages/certifi/cacert.pem +INFO - '2022-11-10' - urllib3.connectionpool - Starting new HTTPS connection (1): alkemy-2022-broc.s3.amazonaws.com:443 +INFO - '2022-11-10' - botocore.awsrequest - Waiting for 100 Continue response. +INFO - '2022-11-10' - botocore.awsrequest - 100 Continue response seen, now sending request body. +INFO - '2022-11-10' - urllib3.connectionpool - https://alkemy-2022-broc.s3.amazonaws.com:443 "PUT /GBUNSalvador_process.txt HTTP/1.1" 200 0 +INFO - '2022-11-10' - botocore.parsers - Response headers: {'x-amz-id-2': 'wtfAN4aej5eCR0Mm8XYo3iXlQI4VM0RrpZ8KYDvalY1HIk2jxe9fQH2yFLwrAiHQIfKgBjK71mY=', 'x-amz-request-id': 'QABBPVPMERM8HX71', 'Date': 'Thu, 10 Nov 2022 11:25:16 GMT', 'ETag': '"92ae4cb6712ac498568d7983d83ec79b"', 'Server': 'AmazonS3', 'Content-Length': '0'} +INFO - '2022-11-10' - botocore.parsers - Response body: +b'' +INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler +INFO - '2022-11-10' - botocore.retryhandler - No retry needed. 
+INFO - '2022-11-10' - botocore.hooks - Event needs-retry.s3.PutObject: calling handler > +INFO - '2022-11-10' - s3transfer.utils - Releasing acquire 0/None +INFO - Done. Returned value was: True +INFO - Marking task as SUCCESS. dag_id=GBUNSalvador_dag_elt, task_id=TaskLoad, execution_date=20221110T102442, start_date=20221110T112513, end_date=20221110T112517 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskLoad airflow_run_id=scheduled__2022-11-10T10:24:42.819313+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskLoad: TaskMetadata(name='GBUNSalvador_dag_elt.TaskLoad', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskLoad', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskLoad', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 
'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': , 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskTransform'}, 'downstream_task_ids': set(), 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:25:17.870024Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskLoad", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskLoad"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, 
"outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskLoad", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "a58d7a98-0eed-4545-9bee-cae7b8f88d22"}} +INFO - Task exited with return code 0 +INFO - 0 downstream tasks scheduled from follow-on schedule check diff --git "a/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskTransform/attempt=1.log" "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskTransform/attempt=1.log" new file mode 100644 index 00000000..925ad9a6 --- /dev/null +++ "b/dags/logs/dag_id=GBUNSalvador_dag_elt/run_id=scheduled__2022-11-10T10\357\200\27224\357\200\27242.819313+00\357\200\27200/task_id=TaskTransform/attempt=1.log" @@ -0,0 +1,38 @@ +INFO - Dependencies all met for +INFO - Dependencies all met for +INFO - +-------------------------------------------------------------------------------- +INFO - Starting attempt 1 of 6 +INFO - +-------------------------------------------------------------------------------- +ERROR - Did not find openlineage.yml and OPENLINEAGE_URL is not set +WARNING - Couldn't initialize transport; will print events to console. 
+INFO - {"eventTime": "2022-11-10T11:24:52.009029Z", "eventType": "START", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"airflow_runArgs": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "externalTrigger": false}, "airflow_version": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "airflowVersion": "2.4.2+astro.1", "openlineageAirflowVersion": "0.15.1", "operator": "airflow.operators.python.PythonOperator", "taskInfo": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "", "retries": 5, "retry_delay": "0:10:00", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": {"dag_id": "GBUNSalvador_dag_elt", "schedule_interval": "1:00:00", "tags": []}, "_log": "", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": "{'TaskLoad'}", "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "{}", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "", "queue": "default", "retries": 5, "retry_delay": "0:10:00", "retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "2022-11-04T00:00:00+00:00", "task_group": "", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": "{'TaskExtract'}", "wait_for_downstream": false, "weight_rule": "downstream"}}, 
"nominalTime": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/NominalTimeRunFacet", "nominalStartTime": "2022-11-10T10:24:42.819313Z"}, "parent": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "0270ed4d-d8a2-3d89-b3e2-80bb94100b3b"}}, "parentRun": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/ParentRunFacet", "job": {"name": "GBUNSalvador_dag_elt", "namespace": "default"}, "run": {"runId": "0270ed4d-d8a2-3d89-b3e2-80bb94100b3b"}}, "unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e50f085-994b-4679-8ace-830f1edc01ca"}} +INFO - TaskInstance Details: dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, dagrun_id=scheduled__2022-11-10T10:24:42.819313+00:00, map_index=-1, run_start_date=2022-11-10 11:24:52.009029+00:00, try_number=1, job_id=3010, op_classpath=airflow.operators.python.PythonOperator +INFO - Executing on 2022-11-10 10:24:42.819313+00:00 +INFO - Started process 241 to run task +INFO - Running: ['airflow', 'tasks', 'run', 'GBUNSalvador_dag_elt', 'TaskTransform', 'scheduled__2022-11-10T10:24:42.819313+00:00', '--job-id', '3010', '--raw', '--subdir', 'DAGS_FOLDER/GBUNSalvador_dag_elt.py', '--cfg-path', '/tmp/tmpk1oazble'] +INFO - Job 3010: Subtask TaskTransform +WARNING - /usr/local/lib/python3.9/site-packages/airflow/configuration.py:545 DeprecationWarning: The sql_alchemy_conn option in [core] has been moved to the sql_alchemy_conn option in [database] - the old setting has been used, but please update your config. +INFO - Running on host 34b830a2c34f +INFO - Exporting the following env vars: +AIRFLOW_CTX_DAG_OWNER=Breyner +AIRFLOW_CTX_DAG_ID=GBUNSalvador_dag_elt +AIRFLOW_CTX_TASK_ID=TaskTransform +AIRFLOW_CTX_EXECUTION_DATE=2022-11-10T10:24:42.819313+00:00 +AIRFLOW_CTX_TRY_NUMBER=1 +AIRFLOW_CTX_DAG_RUN_ID=scheduled__2022-11-10T10:24:42.819313+00:00 +INFO - '2022-11-10' - GBUNSalvador_dag_elt - Transform +INFO - ['GBUNSalvador', 'select.csv'] +INFO - GBUNSalvador +INFO - GBUNSalvador_process.txt +INFO - Done. Returned value was: None +INFO - Marking task as SUCCESS. 
dag_id=GBUNSalvador_dag_elt, task_id=TaskTransform, execution_date=20221110T102442, start_date=20221110T112452, end_date=20221110T112511 +INFO - '2022-11-10' - airflow.listeners.events - session flush listener: added [] unchanged () deleted ['running'] - +INFO - '2022-11-10' - airflow - OpenLineage listener got notification about task instance success +INFO - '2022-11-10' - root - Using extractor PythonExtractor task_type=PythonOperator airflow_dag_id=GBUNSalvador_dag_elt task_id=TaskTransform airflow_run_id=scheduled__2022-11-10T10:24:42.819313+00:00 +INFO - '2022-11-10' - root - Found task metadata for operation TaskTransform: TaskMetadata(name='GBUNSalvador_dag_elt.TaskTransform', inputs=[], outputs=[], run_facets={'unknownSourceAttribute': UnknownOperatorAttributeRunFacet(_producer='https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow', _schemaURL='https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet', unknownItems=[UnknownOperatorInstance(name='PythonOperator', properties={'_BaseOperator__init_kwargs': {'task_id': 'TaskTransform', 'owner': 'Breyner', 'retries': 5, 'retry_delay': datetime.timedelta(seconds=600), 'python_callable': }, '_BaseOperator__from_mapped': False, 'task_id': 'TaskTransform', 'task_group': , 'owner': 'Breyner', 'email': None, 'email_on_retry': True, 'email_on_failure': True, 'execution_timeout': None, 'on_execute_callback': None, 'on_failure_callback': None, 'on_success_callback': None, 'on_retry_callback': None, '_pre_execute_hook': None, '_post_execute_hook': None, 'executor_config': {}, 'run_as_user': None, 'retries': 5, 'queue': 'default', 'pool': 'default_pool', 'pool_slots': 1, 'sla': None, 'trigger_rule': , 'depends_on_past': False, 'ignore_first_depends_on_past': True, 'wait_for_downstream': False, 'retry_delay': datetime.timedelta(seconds=600), 'retry_exponential_backoff': False, 'max_retry_delay': None, 'params': {}, 'priority_weight': 1, 'weight_rule': 
, 'resources': None, 'max_active_tis_per_dag': None, 'do_xcom_push': True, 'doc_md': None, 'doc_json': None, 'doc_yaml': None, 'doc_rst': None, 'doc': None, 'upstream_task_ids': {'TaskExtract'}, 'downstream_task_ids': {'TaskLoad'}, 'start_date': DateTime(2022, 11, 4, 0, 0, 0, tzinfo=Timezone('UTC')), 'end_date': None, '_dag': , '_log': , 'inlets': [], 'outlets': [], 'python_callable': , 'op_args': (), 'op_kwargs': {}, 'templates_dict': None, 'show_return_value_in_logs': True, '_BaseOperator__instantiated': True}, type='operator')])}, job_facets={}) +INFO - '2022-11-10' - root - Manually extracting lineage metadata from inlets and outlets +INFO - '2022-11-10' - openlineage.client.transport.console - {"eventTime": "2022-11-10T11:25:11.815598Z", "eventType": "COMPLETE", "inputs": [], "job": {"facets": {}, "name": "GBUNSalvador_dag_elt.TaskTransform", "namespace": "default"}, "outputs": [], "producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "run": {"facets": {"unknownSourceAttribute": {"_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.15.1/integration/airflow", "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/BaseFacet", "unknownItems": [{"name": "PythonOperator", "properties": {"_BaseOperator__from_mapped": false, "_BaseOperator__init_kwargs": {"owner": "Breyner", "python_callable": "<>", "retries": 5, "retry_delay": "<>", "task_id": "TaskTransform"}, "_BaseOperator__instantiated": true, "_dag": "<>", "_log": "<>", "depends_on_past": false, "do_xcom_push": true, "downstream_task_ids": [], "email_on_failure": true, "email_on_retry": true, "executor_config": {}, "ignore_first_depends_on_past": true, "inlets": [], "op_args": [], "op_kwargs": {}, "outlets": [], "owner": "Breyner", "params": "<>", "pool": "default_pool", "pool_slots": 1, "priority_weight": 1, "python_callable": "<>", "queue": "default", "retries": 5, "retry_delay": "<>", 
"retry_exponential_backoff": false, "show_return_value_in_logs": true, "start_date": "<>", "task_group": "<>", "task_id": "TaskTransform", "trigger_rule": "all_success", "upstream_task_ids": [], "wait_for_downstream": false, "weight_rule": "downstream"}, "type": "operator"}]}}, "runId": "7e50f085-994b-4679-8ace-830f1edc01ca"}} +INFO - Task exited with return code 0 +INFO - 1 downstream tasks scheduled from follow-on schedule check diff --git a/datasets/GBUNComahue_process.txt b/datasets/GBUNComahue_process.txt new file mode 100644 index 00000000..48d82d9f --- /dev/null +++ b/datasets/GBUNComahue_process.txt @@ -0,0 +1,1832 @@ +university career inscription_date first_name last_name gender age postal_code location email +univ. nacional del comahue licenciatura en psicología 2020-09-01 gregory howell male 29 5315 calera la norma frankalexandra@yahoo.com +univ. nacional del comahue farmacia 2020-09-01 tasha brown female 37 8305 aguada san roque tedwards@gmail.com +univ. nacional del comahue medicina 2020-09-01 ian taylor male 35 3428 estacion saladas richard76@gmail.com +univ. nacional del comahue medicina 2020-09-01 mark sanchez male 20 5873 isla oduffy@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-01 sherri carter female 39 1765 isidro casanova fosterchase@gmail.com +univ. nacional del comahue técnico para bioterios 2020-09-01 patricia gardner female 25 3197 abra guazu hughesnina@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-09-01 marissa johns female 34 6034 colonia alberdi john91@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-01 crystal williams female 23 6017 chancay leebrad@yahoo.com +univ. nacional del comahue diseño industrial 2020-09-01 nicole smith female 21 1925 destileria fiscal jshields@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-09-01 timothy dyer male 21 5429 el abanico mariajackson@hotmail.com +univ. 
nacional del comahue licenciatura en administración 2020-09-02 christina long female 21 4750 agua colorada williammcpherson@yahoo.com +univ. nacional del comahue contador público 2020-09-02 michele rivera female 19 2721 el arbolito ewingdiana@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-09-02 steven may male 23 6437 alamos perezchristopher@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-09-02 mary larson female 33 7519 san mayol michaelwhite@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-09-02 kenneth henry male 31 8170 abra de hinojo qyoung@hotmail.com +univ. nacional del comahue arquitectura 2020-09-02 carmen clark female 37 5741 13 de enero richardjohnson@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-02 haley carpenter female 33 3585 el sombrerito yshepherd@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-02 angela simmons female 25 3158 20 de septiembre stonekimberly@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-02 matthew wilson male 23 5835 bella vista campbelldavid@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-02 john hernandez male 17 3172 kilometro 208 lisa58@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-02 joseph mccarthy male 36 2931 isla los laureles laurenchurch@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-02 michael diaz male 25 5557 caracoles woodsydney@hotmail.com +univ. nacional del comahue farmacia 2020-09-02 shawn thomas male 34 5317 apoyaco william73@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-09-02 julie guerrero female 35 3109 colonia centenario warnershirley@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-09-02 melissa newton female 24 2527 colonia san francisco nelsonmegan@yahoo.com +univ. 
nacional del comahue diseño de imagen y sonido 2020-09-03 allen skinner male 36 6651 ingeniero de madrid marksmith@gmail.com +univ. nacional del comahue medicina 2020-09-03 erin jennings female 34 6307 colonia la oracion martinezstephanie@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-03 stacey kidd female 23 2715 el socorro zsexton@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-09-03 warren torres male 29 3111 almacen cristian schubert bishopkevin@hotmail.com +univ. nacional del comahue actuario 2020-09-03 natalie gilbert female 21 3134 antonio tomas sud cowanjennifer@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-03 margaret jimenez female 23 3192 colonia bertozzi jenniferthompson@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-09-03 kristopher wright male 18 1842 el jaguel elliottashley@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-03 todd warren male 33 2142 campo medina debra01@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-03 ian freeman male 17 2630 firmat joshuamorgan@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-04 alexis ford female 31 7400 barrio la luisa westtamara@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-04 dawn roberts female 19 6321 caichue manningbarbara@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-04 jason montes male 23 3194 paso telegrafo wbryant@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-04 jesse frazier male 19 6233 condarco matthew83@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-04 anthony jackson male 23 8534 aguada cecilio williamstracy@yahoo.com +univ. 
nacional del comahue licenciatura en psicología 2020-09-04 sherri hester female 23 8347 arroyo cahunco donaldreilly@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-04 anita martinez female 21 1890 juan maria gutierrez okelley@gmail.com +univ. nacional del comahue arquitectura 2020-09-04 andre gutierrez male 21 5600 agua de la mula jasonjones@hotmail.com +univ. nacional del comahue diseño industrial 2020-09-04 catherine may female 38 1664 trujui anthonyjohnson@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-09-04 jeffrey obrien male 25 3337 adolfo j pomar transcott@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-04 amanda hill female 33 8105 aguara gregorybaker@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-09-04 tracey anderson female 24 1927 esc nav militar rio sant srowe@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-04 angela gilmore female 18 3536 bocas johnsontara@hotmail.com +univ. nacional del comahue agronomía 2020-09-04 carla barnes female 31 5384 punta de los llanos hallian@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-05 matthew frost male 25 6042 dos hermanos hparker@hotmail.com +univ. nacional del comahue farmacia 2020-09-05 zachary jackson male 27 6455 carlos tejedor rodriguezscott@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-05 amy mendoza female 21 2508 armstrong chamberskevin@gmail.com +univ. nacional del comahue diseño industrial 2020-09-05 zachary obrien male 19 3366 almirante brown ryanlee@hotmail.com +univ. nacional del comahue farmacia 2020-09-05 craig richards male 27 5439 belgrano jennifer39@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-05 thomas brown male 29 1770 aldo bonzi lsanford@gmail.com +univ. 
nacional del comahue medicina 2020-09-05 leah branch female 19 4000 estacion de zootecnia b masonkevin@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-09-05 ashley scott female 29 4516 caimancito asimmons@yahoo.com +univ. nacional del comahue bioquímica 2020-09-05 frank robinson male 37 5596 12 de octubre pmanning@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-05 kelli rivera female 31 8363 colonia josefa oyoung@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-09-05 vicki phillips female 19 7011 aneque grande robertslisa@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-06 edward taylor male 25 9050 gobernador moyano whiteheadshane@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-06 nicholas johnson male 27 3461 abo nezu ytorres@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-06 james petty male 19 5521 los corredores ethanjimenez@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-06 jamie smith female 29 2216 campo raffo zachary24@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-06 andrew myers male 29 7533 quiñihual estacion breannaward@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-09-06 julia mills female 34 6503 desvio kilometro 234 kochrickey@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-06 catherine mann female 37 4230 brea chimpana katelynwest@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-09-06 valerie hughes female 23 7203 chapaleufu smcdonald@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-07 richard brown male 21 1601 isla martin garcia chelsey16@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-07 catherine bush female 20 2309 colonia reina margarita amandadoyle@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-09-07 nicholas vasquez male 33 2185 campo crenna nburgess@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-07 samantha ferguson female 19 2445 cristolia alyssamoore@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-07 emily page female 37 2705 haras san jacinto robert29@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-07 amanda diaz female 28 3344 2 de julio jefferydennis@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-07 christine mayer female 33 2156 arsenal de guerra san lorenzo taylordana@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-09-07 david jones male 29 1842 el jaguel hernandezmegan@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-07 mark bradley male 39 2113 peyrano twebb@gmail.com +univ. nacional del comahue agronomía 2020-09-07 john bowen male 35 2824 britos rhart@gmail.com +univ. nacional del comahue actuario 2020-09-07 robert moreno male 29 3574 capilla guadalupe norte nwatson@yahoo.com +univ. nacional del comahue agronomía 2020-09-07 andrea alexander female 31 1896 camino centenario km 11500 christina09@gmail.com +univ. nacional del comahue agronomía 2020-09-07 felicia valdez female 25 3620 kilometro 184 greenefrederick@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-07 michele romero female 25 1739 general hornos salinasjanice@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-07 michael mosley male 27 6500 9 de julio donnajones@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias geológicas 2020-09-07 charles leach male 33 5779 la chilca barbaraturner@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-08 michael simpson male 35 6652 olascoaga davidgaines@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-08 amanda jordan female 33 3522 el retiro robert92@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-09-08 jessica ross female 27 6003 ascencion robert92@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-08 darlene garner female 37 3366 almirante brown jmadden@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-08 patrick garrett male 39 4186 cañete greenecharles@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-08 zoe oconnell female 37 5419 baños de la laja jill45@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-08 michelle shelton female 17 3427 abra breweramber@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-08 megan mendoza female 37 3416 arroyo ceibal michellelynch@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-08 joseph estrada male 27 6643 araujo oatkinson@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-09 jennifer may female 21 5474 barranquitas aaron63@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-09 jordan gilmore male 25 3472 caaguazu wspencer@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-09 michael thompson male 30 2824 britos kimberly13@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-09 james taylor male 27 2500 cañada de gomez sheenasilva@hotmail.com +univ. 
nacional del comahue arquitectura 2020-09-09 kim burton female 21 5438 alto de sierra rogersdavid@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-09 tricia evans female 39 5589 chapanay millergregory@hotmail.com +univ. nacional del comahue farmacia 2020-09-09 kirk calderon male 25 2609 colonia morgan cpalmer@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-09 kimberly calderon female 25 3181 arroyo moreira ggraham@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-09-09 erin reeves female 31 2854 dos hermanas timothyvega@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-09 rachel newman female 38 1678 caseros oscarnielsen@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-09 rachel lane female 37 5423 capitan lazo sandersbrandy@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-09 melvin castro male 17 2527 colonia san francisco keithglenn@gmail.com +univ. nacional del comahue medicina 2020-09-09 tricia mendoza female 33 6244 banderalo smithbryan@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-09-09 brittany soto female 39 5511 general gutierrez dustin57@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-09-09 regina reid female 25 5345 baños termales perrynoah@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-10 stacy hall female 31 2828 colonia nueva montevideo zwalters@hotmail.com +univ. nacional del comahue bioquímica 2020-09-10 monica garcia female 34 6239 gonzalez moreno allison79@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-10 rodney neal male 21 1646 san fernando schmittanthony@hotmail.com +univ. 
nacional del comahue ciencias veterinarias 2020-09-10 melissa nelson female 23 6230 francisco casal amccormick@hotmail.com +univ. nacional del comahue actuario 2020-09-10 jason wyatt male 31 3216 arroyo hondo rlowe@gmail.com +univ. nacional del comahue contador público 2020-09-10 duane fowler male 35 1872 sarandi steven63@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-10 katherine benson female 31 7118 general guido ujones@hotmail.com +univ. nacional del comahue agronomía 2020-09-10 john parks male 33 7165 faro querandi mbaldwin@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-10 erica hampton female 38 6700 caminera lujan carmenwarren@yahoo.com +univ. nacional del comahue farmacia 2020-09-10 sherry johnson female 35 5636 favelli janet27@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-10 jack jackson male 35 8333 aguada guzman ejones@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-10 tiffany contreras female 21 3203 arroyo grande daniellegraham@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-10 jennifer fox female 25 3196 arroyo vega qstrickland@gmail.com +univ. nacional del comahue contador público 2020-09-10 steven smith male 23 1627 matheu kristin73@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-11 larry martinez male 33 3057 estancia las gamas peterhess@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-11 theresa bentley female 31 1879 quilmes oeste holson@gmail.com +univ. nacional del comahue técnico para bioterios 2020-09-11 lisa vincent female 27 6667 agustin mosconi gomezjose@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-11 jenny valdez female 21 6701 carlos keen wileyjacqueline@hotmail.com +univ. 
nacional del comahue ingeniería electrónica 2020-09-11 christopher gutierrez male 23 2121 perez jrush@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-11 amanda dyer female 21 2208 gaboto srodriguez@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-09-11 melissa wallace female 21 1870 avellaneda thomas12@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-11 mario rosales male 35 8424 aguada de guerra xcarroll@yahoo.com +univ. nacional del comahue farmacia 2020-09-11 haley adkins female 33 5444 ampacama garrisonstacie@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-11 carlos johnson male 35 6614 franklin owengeorge@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-11 hannah ballard female 37 7249 el araza monique87@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-11 ronnie wood male 18 7169 juancho lewislisa@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-11 steven fields male 29 1686 hurlingham brookewhite@yahoo.com +univ. nacional del comahue diseño industrial 2020-09-12 megan green female 23 2134 roldan heather75@yahoo.com +univ. nacional del comahue medicina 2020-09-12 richard sanchez male 37 5470 abra verde yyates@yahoo.com +univ. nacional del comahue medicina 2020-09-12 joel kelly male 34 9030 rio mayo christopher34@gmail.com +univ. nacional del comahue licenciatura en administración 2020-09-12 ashley schultz female 35 3234 bonpland fjimenez@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-12 cassandra moore female 31 3183 albariño thompsonbrandon@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-12 scott evans male 24 2812 capilla del señor markjackson@hotmail.com +univ. 
nacional del comahue actuario 2020-09-12 christopher lane male 27 2800 arroyo aguila negra ryan53@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-12 david miller male 35 2138 carcaraña deborahlewis@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-12 hannah moore female 27 1812 carlos spegazzini taylormikayla@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-12 corey lindsey male 31 4109 alto nuestra señora del valle paigetrevino@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-12 matthew gamble male 23 7150 ayacucho acarroll@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-09-12 molly fowler female 25 8187 bordenave stephanie22@yahoo.com +univ. nacional del comahue actuario 2020-09-12 aaron roy male 31 1865 el pampero johnguzman@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-13 jesse kelley male 23 8208 campo cicare woodnicole@gmail.com +univ. nacional del comahue contador público 2020-09-13 carl smith male 25 7240 kilometro 112 spearsjared@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-13 tyler young male 21 7407 libano james90@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-13 joseph gregory male 19 5730 20 de febrero brenda13@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-13 nichole payne female 31 5535 asuncion fraziersusan@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-13 charles carter male 29 5753 agua linda david64@yahoo.com +univ. nacional del comahue bioquímica 2020-09-13 rodney jacobson male 30 7136 adela westjoseph@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-09-13 sandra johnson female 31 5565 campo de los andes xmeza@gmail.com +univ. 
nacional del comahue ingeniería mecánica 2020-09-14 veronica wilson female 37 5555 puente del inca yvelazquez@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-14 jason chen male 22 5343 lavalle garneranthony@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-09-14 michael jackson male 21 9225 arenoso holly00@yahoo.com +univ. nacional del comahue bioquímica 2020-09-14 kimberly mclean female 33 5327 capihuas robinsondavid@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-14 anthony hernandez male 29 1986 altamirano robert92@hotmail.com +univ. nacional del comahue farmacia 2020-09-14 crystal carpenter female 33 3218 arroyo palmar alicia62@gmail.com +univ. nacional del comahue agronomía 2020-09-14 alex copeland male 17 5763 general urquiza wellis@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-14 cindy martin female 27 2527 colonia san francisco lynnholland@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-09-14 brian armstrong male 37 2218 carrizales gmiller@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-15 sara bell female 29 5407 dique toma ihoover@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-15 kimberly thomas female 17 3705 10 de mayo jharris@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-15 scott horton male 25 2520 la california sarah39@yahoo.com +univ. nacional del comahue diseño industrial 2020-09-15 theresa le female 30 2121 perez paulcortez@gmail.com +univ. nacional del comahue licenciatura en artes 2020-09-15 joanne anderson female 39 5306 carrizal joseph32@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-09-15 steven harper male 17 6075 arenaza jennifer14@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-15 david lara male 19 4722 el duraznillo nzamora@gmail.com +univ. 
nacional del comahue licenciatura en musicoterapia 2020-09-15 nathan vaughn male 34 6661 blas durañona coreysharp@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-15 bonnie riley female 19 4622 bella vista jason74@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-09-15 alexander kramer male 35 2944 rio tala jesse67@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-15 mallory moore female 27 2907 general conesa haydenthomas@gmail.com +univ. nacional del comahue arquitectura 2020-09-16 derek webb male 23 3072 la lucila marymoreno@hotmail.com +univ. nacional del comahue agronomía 2020-09-16 christopher mack male 30 9409 isla gran malvina joshua96@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-16 arthur arellano male 17 8200 colonia lia y allende parrishkelly@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-16 cindy bishop female 17 6050 cuartel vii vickiejenkins@hotmail.com +univ. nacional del comahue diseño industrial 2020-09-16 paula peters female 37 9315 bajo caracoles samanthahatfield@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-09-16 sherry hoffman female 31 4431 aguas calientes maryreed@hotmail.com +univ. nacional del comahue bioquímica 2020-09-16 jessica burns female 19 6538 la dorita jeffreydavis@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-16 kevin fitzgerald male 19 5266 chichagasta adavenport@gmail.com +univ. nacional del comahue licenciatura en administración 2020-09-16 ryan curtis male 29 2344 achaval rodriguez nelsonamy@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-09-16 john jones male 29 2300 colonia bella italia sheltonmatthew@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-16 deborah carter female 37 6700 caminera lujan richardjohnson@gmail.com +univ. 
nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-17 david luna male 27 3117 aldea san antonio hgardner@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-09-17 jason hernandez male 21 6009 san marcelo pdavis@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-17 deborah wilson female 31 9400 an aike karen52@gmail.com +univ. nacional del comahue medicina 2020-09-17 amy smith female 19 9223 alto rio pico espinozajessica@yahoo.com +univ. nacional del comahue bioquímica 2020-09-17 joseph stevenson male 17 7172 colonia ferrari andrew27@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-17 george schultz male 39 7160 la union dwright@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-17 megan gardner female 35 2933 colonia velez kyle23@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-17 jessica burns female 31 2613 la morocha thomas03@gmail.com +univ. nacional del comahue bioquímica 2020-09-17 tonya nguyen female 31 2200 las quintas nathanhoover@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-09-17 troy lawrence male 33 6430 adolfo alsina james77@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-17 suzanne phillips female 37 4643 antiguyos tpowers@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-17 nancy jones female 39 1746 francisco alvarez randy73@gmail.com +univ. nacional del comahue diseño industrial 2020-09-18 karen castillo female 27 9039 hito 45 walkerrodney@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-18 christian sanchez male 35 6641 comodoro py alexis34@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-09-18 tony young male 39 2347 colonia mackinlay gordonwilliam@yahoo.com +univ. nacional del comahue bioquímica 2020-09-18 lori sanford female 24 6628 colonia zambungo xwiggins@hotmail.com +univ. 
nacional del comahue licenciatura en producción de bioimagenes 2020-09-18 jane campbell female 20 7311 chillar gillespiebrian@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-18 sandra miller female 17 6065 blaquier thorntonkimberly@hotmail.com +univ. nacional del comahue farmacia 2020-09-18 kathy powell female 23 3133 arroyo burgos chris21@hotmail.com +univ. nacional del comahue contador público 2020-09-18 christopher hickman male 39 7220 funke dlopez@gmail.com +univ. nacional del comahue medicina 2020-09-19 charles gardner male 31 7408 la colina vburnett@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-19 wendy green female 33 1858 villa numancia tinamccann@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-19 sharon hughes female 39 4147 alto las lechuzas garyreilly@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-19 patricia brown female 29 2843 general galarza jacobgarcia@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-19 gary berry male 22 4724 agua colorada jennifer89@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-09-19 alexandria lee female 23 8305 aguada san roque frankjason@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-19 michelle simmons female 19 1655 jose leon suarez brendan58@gmail.com +univ. nacional del comahue diseño industrial 2020-09-19 mark espinoza male 38 1822 valentin alsina hfrank@hotmail.com +univ. nacional del comahue farmacia 2020-09-19 robert moore male 23 3085 pilar loriwong@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-19 ricardo taylor male 29 1684 ciudad jardin del palomar whitney61@hotmail.com +univ. nacional del comahue arquitectura 2020-09-19 paul brown male 17 2752 almacen el descanso zwilcox@yahoo.com +univ. 
nacional del comahue licenciatura en gestión de agroalimentos 2020-09-19 martha morgan female 25 6203 el olivo tracywilkinson@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-19 robert carpenter male 27 5461 aguada de la peña anthonysmith@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-19 taylor duncan female 22 5755 alto del molle phillip16@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-20 brenda anderson female 37 9107 28 de julio tuckerrichard@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-20 ian carter male 21 4152 aguilares harrisondavid@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-20 maria hall female 25 3164 colonia rivas bjackson@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-20 linda collins female 23 2852 alarcon fclark@gmail.com +univ. nacional del comahue bioquímica 2020-09-20 charles torres male 25 2506 correa ralph16@yahoo.com +univ. nacional del comahue agronomía 2020-09-20 dana gonzalez female 25 6601 altamira garciajesse@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-20 rita thomas female 29 4237 cortaderas jacobwarren@yahoo.com +univ. nacional del comahue contador público 2020-09-20 christopher morris male 32 6343 los gauchos qgonzalez@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-09-20 christopher moore male 25 8303 cinco saltos cassandracruz@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-09-20 stanley stevenson male 25 5431 apeadero guanacache monicaduncan@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-09-21 jacqueline snyder female 37 8400 isla victoria charlesortiz@yahoo.com +univ. nacional del comahue diseño industrial 2020-09-21 kimberly smith female 23 5713 balde ahumada kevinrivera@gmail.com +univ. 
nacional del comahue licenciatura en ciencias geológicas 2020-09-21 reginald shepherd male 39 7107 santa teresita dudleycurtis@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-09-21 donald byrd male 20 5523 buena nueva melinda63@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-21 jonathan medina male 19 8208 campo cicare nicholscarlos@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-21 james baker male 37 1802 aeropuerto ezeiza steven22@yahoo.com +univ. nacional del comahue medicina 2020-09-21 wesley king male 31 8412 cañadon del corral amartin@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-21 robert wright male 19 4622 bella vista ashleymartinez@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-21 brian stevens male 25 5547 villa hipodromo michael62@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-21 robert long male 28 6648 mecha ygreen@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-21 connie moore female 27 1655 jose leon suarez starkjohn@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-21 omar ross male 19 7165 faro querandi matthewking@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-21 cheryl nielsen female 21 2204 jesus maria lindaevans@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-21 joseph mitchell male 39 2156 arsenal de guerra san lorenzo jimmymoreno@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-22 martha ayala female 23 4105 abra del tafi jsmith@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-22 erika lee female 35 7635 el lenguaraz peggyjones@gmail.com +univ. 
nacional del comahue contador público 2020-09-22 brandy robinson female 39 5533 9 de julio masonhoffman@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-09-22 eugene wong male 21 8373 alianza lisa17@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-22 manuel english male 38 6652 olascoaga xhill@hotmail.com +univ. nacional del comahue actuario 2020-09-22 claudia perez female 35 8308 villa manzano xrichardson@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-22 kimberly esparza female 27 8307 colonia gobernador ayala jeffreycooper@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-22 patricia wilson female 17 3051 alejandra joshuaramirez@yahoo.com +univ. nacional del comahue actuario 2020-09-22 julian smith male 33 7412 las hermanas anthonyrebekah@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-09-23 chad lee male 29 6065 blaquier awalker@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-09-23 paul moore male 17 8153 balneario oriente tamarasantos@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-23 kim hoffman female 31 5381 bella vista sobrien@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-23 joseph gray male 19 5615 25 de mayo jonesryan@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-23 johnny carter male 37 7208 coronel boerr douglas26@hotmail.com +univ. nacional del comahue farmacia 2020-09-23 anthony johnson male 21 5624 kilometro 47 joshuarodriguez@hotmail.com +univ. nacional del comahue diseño industrial 2020-09-23 sarah martin female 27 3113 colonia celina yhughes@gmail.com +univ. nacional del comahue bioquímica 2020-09-23 maria anderson female 38 5605 calle larga vieja tanya29@yahoo.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-09-24 james garrison male 35 5261 agua del simbol angelahiggins@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-09-24 amber hall female 25 7267 alvarez de toledo bhoward@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-24 joanna adams female 29 4101 agua negra perezjonathan@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-09-24 lisa holden female 37 2454 cañada rosquin christophermorgan@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-24 susan wallace female 19 2828 colonia nueva montevideo lauren17@gmail.com +univ. nacional del comahue bioquímica 2020-09-24 katherine mitchell female 35 3013 colonia matilde michaelromero@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-09-24 richard stephens male 23 6216 bagual kmoore@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-24 julia lopez female 27 6507 corbett pachecosteven@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-24 david sanders male 19 6461 capitan castro ravengill@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-24 tyler lee male 39 2854 dos hermanas anthonyking@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-24 ashley randall female 19 1708 moron rscott@gmail.com +univ. nacional del comahue agronomía 2020-09-24 breanna wells female 29 5710 la punta kevin45@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-09-24 brittney gibson female 23 4159 alto el puesto johnnybradley@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-24 joseph boyer male 29 2216 campo raffo gary33@hotmail.com +univ. nacional del comahue medicina 2020-09-24 matthew castillo male 39 5417 9 de julio smithjoshua@hotmail.com +univ. 
nacional del comahue bioquímica 2020-09-24 james edwards male 21 6557 arboleda bettybell@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-25 matthew taylor male 26 3060 campo san jose christopherpeterson@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-25 william figueroa male 33 7404 fortin lavalle kathleen16@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-09-25 alicia zimmerman female 37 6453 carlos salas jasonparks@hotmail.com +univ. nacional del comahue medicina 2020-09-25 brittany holt female 19 3511 colonia coronel dorrego denise76@gmail.com +univ. nacional del comahue ingeniería en informática 2020-09-25 kathryn garcia female 21 7407 libano donnaross@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-09-25 mary morse female 39 3486 villa olivari cameronpeggy@hotmail.com +univ. nacional del comahue actuario 2020-09-25 lori hernandez female 18 3714 9 de julio justingonzales@yahoo.com +univ. nacional del comahue contador público 2020-09-25 sherry smith female 21 3007 empalme san carlos karenmccoy@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-09-25 jake gomez male 25 2403 bauer y sigel heather62@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-09-25 gregory baker male 27 5579 barrio lencina hernandezchristian@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-09-25 kaitlyn rice female 29 4143 independencia dparker@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-26 amy delacruz female 21 8109 almirante solier brittanyholder@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-09-26 deborah garcia female 23 2801 alto verde martinmichelle@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-26 kevin smith male 39 2900 san nicolas de los arroyos kelseyduncan@hotmail.com +univ. 
nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-26 donald jones male 23 7109 barrio pedro rocco jeffrey29@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-09-26 mark faulkner male 27 1871 dock sud englishlindsay@yahoo.com +univ. nacional del comahue contador público 2020-09-26 albert booker male 31 5407 dique toma kcarey@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-26 julia miller female 31 1714 ituzaingo emiddleton@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-26 shawn campbell male 35 6383 campo moises seccion 1a bowmantammy@yahoo.com +univ. nacional del comahue arquitectura 2020-09-26 taylor tanner female 31 5306 carrizal gthomas@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-26 david knight male 21 4648 barrio la union tyler23@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-26 shannon cuevas female 33 2930 la buana moza garnershawn@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-09-26 joshua hernandez male 29 3374 el porvenir kevinparker@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-09-26 brandon hamilton male 23 5407 dique toma oholt@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-26 adam baker male 33 6643 araujo lnewman@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-26 sandra knapp female 23 6628 colonia zambungo qmcgrath@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-09-26 charles rosario male 25 7105 san clemente del tuyu donaldhorn@gmail.com +univ. nacional del comahue actuario 2020-09-26 kimberly booth female 29 3364 2 de mayo jacob03@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-26 jeanne rodriguez female 39 4701 acostilla jason48@hotmail.com +univ. 
nacional del comahue licenciatura en relaciones del trabajo 2020-09-27 audrey guzman female 35 8107 base aeronaval cmte espora joshua14@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-09-27 anthony skinner male 23 3044 gobernador crespo karen55@gmail.com +univ. nacional del comahue bioquímica 2020-09-27 jessica jones female 36 8151 el zorro obrennan@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-27 david foster male 35 2187 arteaga zjones@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-09-27 dana mcgee female 17 6511 hale nathan61@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-27 jeffrey richardson male 39 5303 anjullon laura56@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-09-27 charles johnson male 31 3518 cabral cue david57@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-09-27 robert gates male 37 2208 gaboto susansandoval@yahoo.com +univ. nacional del comahue medicina 2020-09-27 michael bridges male 19 2843 general galarza anthony45@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-27 anthony sutton male 29 1884 berazategui jblanchard@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-27 tammy perez female 37 1986 altamirano esmith@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-27 cassandra sanford female 38 2944 rio tala luke63@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-09-27 taylor johnson male 37 6559 recalde jacobcunningham@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-09-27 kenneth newman male 31 4176 alto del puesto ereeves@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-27 raymond johnson male 31 1741 enrique fynn jessicajackson@yahoo.com +univ. 
nacional del comahue bioquímica 2020-09-27 abigail hill female 21 5750 alto de la leña llong@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-27 lauren miranda female 25 8185 campo del norte americano ronald22@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-27 david haas male 33 5561 ancon michelle99@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-27 linda figueroa female 27 4142 alto de leiva vtorres@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-09-28 michele yu female 17 6403 badano lindseyjordan@hotmail.com +univ. nacional del comahue actuario 2020-09-28 andrew foster male 29 6343 los gauchos kristinjones@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-09-28 richard walker male 23 5734 la ribera nraymond@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-09-28 katherine nichols female 33 4235 albigasta nedwards@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-09-28 michele lopez female 39 8105 aguara hendrixvincent@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-09-28 peggy edwards female 25 3351 azara nielsenangel@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-28 maurice richard male 35 7519 san mayol lwalker@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-09-28 laura nolan female 21 4650 abra de peñas cookbarry@gmail.com +univ. nacional del comahue arquitectura 2020-09-28 patrick murphy male 29 8307 colonia gobernador ayala krobinson@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-09-28 randy tyler male 39 3172 kilometro 208 leslie36@hotmail.com +univ. nacional del comahue actuario 2020-09-29 kelsey powell female 35 4618 abra de pives richardstrevor@hotmail.com +univ. 
nacional del comahue licenciatura en planificación y diseño del paisaje 2020-09-29 jose garrison male 31 7600 barrio emir ramon juarez randy41@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-29 jessica olson female 21 5343 lavalle sharris@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-09-29 gilbert kelly male 37 5306 carrizal marissamorgan@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-09-29 michael reyes male 17 5463 alto huaco angelawong@gmail.com +univ. nacional del comahue actuario 2020-09-29 alison ewing female 34 8316 balsa senillosa schmidtelizabeth@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-09-29 helen le female 23 2622 maggiolo casey14@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-09-29 allison hill female 29 6727 gouin jennifermiles@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-09-29 lisa klein female 25 5380 chamical leslienunez@yahoo.com +univ. nacional del comahue actuario 2020-09-29 amanda edwards female 31 2105 cañada rica devinmoore@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-09-29 michelle johnson female 39 5442 ambas puntillas dana37@hotmail.com +univ. nacional del comahue diseño industrial 2020-09-29 heather burns female 23 3313 arroyo del medio michael54@gmail.com +univ. nacional del comahue actuario 2020-09-29 richard chavez male 31 5275 agua colorada jameshartman@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-09-30 robert ward male 33 3263 1 de mayo nschmidt@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-09-30 kenneth rodriguez male 31 3401 arroyo pelon stephaniebenjamin@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-09-30 kimberly campbell female 21 9405 bahia tranquila susan73@gmail.com +univ. 
nacional del comahue ingeniería mecánica 2020-09-30 scott wong male 19 6360 barrio el molino bwilliams@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-09-30 jessica griffin female 17 3714 9 de julio martinezbonnie@gmail.com +univ. nacional del comahue diseño industrial 2020-09-30 diane jimenez female 35 9407 28 de noviembre sjohnson@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-01 nicholas johnson male 39 2216 campo raffo nicholassalazar@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-10-01 michael hester male 23 2705 haras san jacinto heather31@hotmail.com +univ. nacional del comahue contador público 2020-10-01 william thomas male 27 3061 antonio pini housealex@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-01 frank nunez male 31 8316 balsa senillosa ralph78@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-01 brenda martin female 23 2156 arsenal de guerra san lorenzo gthomas@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-01 dawn bailey female 24 3304 barrio don santiago kylefarrell@hotmail.com +univ. nacional del comahue bioquímica 2020-10-01 tina gillespie female 30 7105 san clemente del tuyu xreeves@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-10-01 amber glenn female 27 2745 gahan christyadams@gmail.com +univ. nacional del comahue medicina 2020-10-01 william osborn male 19 7600 barrio emir ramon juarez mscott@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-02 michael thompson male 25 5465 baños pismanta susanjames@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-02 james romero male 31 1617 el talar tranalexandra@gmail.com +univ. 
nacional del comahue licenciatura en ciencias biológicas 2020-10-02 john adams male 35 8144 colonia monte la plata ktorres@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-02 brittany hernandez female 25 7318 colonia hinojo jlong@hotmail.com +univ. nacional del comahue farmacia 2020-10-02 brian lambert male 23 8144 colonia monte la plata tvelazquez@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-02 christopher thompson male 29 4616 barcena duncanrobert@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-10-02 sabrina thompson female 35 2732 4 de febrero watkinscarlos@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-02 matthew huff male 25 2617 sancti spiritu oburch@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-10-02 ian murphy male 40 1854 longchamps fdavis@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-02 michelle parker female 21 2134 roldan vickie13@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-03 rachel rich female 37 7221 francisco berra sheila33@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-10-03 denise ramirez female 23 6239 gonzalez moreno rebeccaray@gmail.com +univ. nacional del comahue ingeniería en informática 2020-10-03 andrew williams male 23 5439 belgrano deanbruce@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-10-03 maria miller female 37 2843 general galarza ericksonjessica@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-03 tom fletcher male 21 7110 cuartel iv rodney68@yahoo.com +univ. nacional del comahue arquitectura 2020-10-03 stephanie watkins female 25 5427 apeadero quiroga blakemichael@yahoo.com +univ. nacional del comahue arquitectura 2020-10-03 jason jackson male 37 8122 la viticola wcain@gmail.com +univ. 
nacional del comahue bioquímica 2020-10-03 breanna wolf female 31 5609 aristides villanueva patrickgregory@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-03 edward brown male 31 2732 4 de febrero dominic11@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-10-03 jacob hawkins male 17 2806 las palmas osbornesteven@gmail.com +univ. nacional del comahue actuario 2020-10-03 kara long female 25 3340 boqueron adamscolleen@hotmail.com +univ. nacional del comahue actuario 2020-10-03 james clay male 37 4719 balcosna marykelly@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-03 ryan campbell male 39 7545 huanguelen robert79@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-04 nicole oconnor female 28 5438 alto de sierra tonya62@yahoo.com +univ. nacional del comahue farmacia 2020-10-04 justin chen male 39 5595 cupiles ajohnson@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-04 daniel jordan male 17 2214 aldao shatfield@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-10-04 christina arias female 29 3522 el retiro zsummers@gmail.com +univ. nacional del comahue técnico para bioterios 2020-10-04 brittany martin female 17 2900 san nicolas de los arroyos henryamber@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-04 emily ayala female 33 6438 masurel portersusan@gmail.com +univ. nacional del comahue farmacia 2020-10-04 philip salinas male 21 6009 san marcelo tmarquez@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-05 gabriela mcgrath female 29 2253 campo gimenez alexisanderson@hotmail.com +univ. nacional del comahue actuario 2020-10-05 cathy long female 28 3317 arroyo magdalena ndavis@gmail.com +univ. 
nacional del comahue ingeniería en informática 2020-10-05 willie bradley male 23 3254 colonia la blanquita zgill@hotmail.com +univ. nacional del comahue contador público 2020-10-05 mary wallace female 30 3401 arroyo pelon coxmary@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-10-05 jessica francis female 21 7517 juan e barra melissa16@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-05 anthony compton male 37 6555 alfalad nataliecrawford@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-05 casey lewis male 27 3445 9 de julio johnsonchristian@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-10-05 jeremy morris male 35 1603 villa martelli misty51@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-05 misty colon female 39 5563 agua amarga kcampbell@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-05 kyle smith male 27 5634 bowen kylemartin@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-05 jasmine salazar female 23 3425 costa grande cameronstephanie@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-05 rachel velez female 17 8349 aguas de las mulas powellchristopher@hotmail.com +univ. nacional del comahue diseño industrial 2020-10-05 anita fernandez female 37 2943 ireneo portela joneskristen@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-05 tyler ross male 39 3261 centella tanneryolanda@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-05 nancy mcpherson female 19 4648 barrio la union joelsnyder@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-05 erin hartman female 23 1718 san antonio de padua newtonmargaret@hotmail.com +univ. 
nacional del comahue contador público 2020-10-05 sarah johnson female 23 6437 alamos davidwilliams@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-06 michael patel male 31 9220 cañadon la madera emily48@hotmail.com +univ. nacional del comahue arquitectura 2020-10-06 barbara lee female 23 3518 cabral cue stokesdevon@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-06 christine strickland female 25 5590 adrian maturano rebeccaphillips@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-10-06 roger ramirez male 27 1826 remedios de escalada alexanderrobinson@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-10-06 jeffrey curtis male 31 7601 barrio batan mhendricks@yahoo.com +univ. nacional del comahue diseño industrial 2020-10-06 justin hopkins male 39 6439 bonifacio chanchristina@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-10-06 marcus hall male 23 5303 anjullon david12@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-06 tiffany gilbert female 25 2725 hughes yingram@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-06 brian smith male 27 4231 albigasta yhenderson@hotmail.com +univ. nacional del comahue actuario 2020-10-06 jeff gonzales male 17 8322 cutral co robert54@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-06 kimberly blair female 31 2914 costa brava robertbraun@gmail.com +univ. nacional del comahue medicina 2020-10-06 terry cox male 29 5719 agua amarga galvancynthia@hotmail.com +univ. nacional del comahue medicina 2020-10-06 brian huber male 27 1739 general hornos mwarren@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-06 april rodriguez female 27 1640 acassuso ylee@yahoo.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-10-06 raymond coleman male 17 6337 ingeniero thompson jeffery22@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-06 thomas thomas male 23 5505 carbometal carrie51@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-10-06 tyler morales male 39 6667 agustin mosconi michaelhogan@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-07 timothy keller male 21 5605 calle larga vieja mmccall@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-10-07 jake brown male 29 3204 ayui parada hayesbenjamin@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-10-07 michael coleman male 17 1879 quilmes oeste toni31@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-07 kenneth garcia male 32 5361 aicuña crawfordangela@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-07 luis mueller male 37 5500 cerro aconcagua jamessanders@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-07 christine watson female 25 3117 aldea san antonio charlestran@yahoo.com +univ. nacional del comahue farmacia 2020-10-07 lisa saunders female 35 4195 7 de abril ywilliams@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-07 juan howard male 19 8300 las perlas ptaylor@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-07 robert jones male 29 2745 gahan gloriasalinas@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-07 melanie maxwell female 17 8503 chocori frazierkara@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-07 anne marquez female 31 4743 aconquija tiffany19@gmail.com +univ. nacional del comahue técnico para bioterios 2020-10-07 victoria ford female 21 6058 pazos kanki danagoodwin@hotmail.com +univ. 
nacional del comahue agronomía 2020-10-07 paul daniels male 25 1763 virrey del pino cartercasey@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-07 terrance martin male 21 8415 arroyo las minas watkinsclaire@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-07 carol shaw female 37 9101 alto de las plumas lindsey45@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-10-07 carolyn baker female 37 4653 casira qingram@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-07 robert garcia male 31 2600 boca p 25 jamessmith@hotmail.com +univ. nacional del comahue bioquímica 2020-10-07 jessica hancock female 23 6614 franklin sanchezcarl@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-08 mary gonzalez female 33 6063 porvenir susanjones@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-08 thomas ferguson male 31 3133 arroyo burgos rramos@gmail.com +univ. nacional del comahue diseño industrial 2020-10-08 joshua hernandez male 30 3183 albariño jessicadavis@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-08 katie washington female 27 6341 chapi talo linda72@yahoo.com +univ. nacional del comahue medicina 2020-10-08 matthew fox male 37 5612 valle de las leñas alyssarodriguez@yahoo.com +univ. nacional del comahue contador público 2020-10-08 jasmine rodriguez female 29 4632 antumpa lpratt@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-10-08 jacob copeland male 17 2500 cañada de gomez gregorydougherty@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-08 julie garcia female 27 5577 el alto daniel38@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-08 william thomas male 17 4159 alto el puesto orobinson@yahoo.com +univ. 
nacional del comahue licenciatura en ciencia política 2020-10-08 austin saunders male 29 6450 abel cruzmichael@gmail.com +univ. nacional del comahue arquitectura 2020-10-08 david ferguson male 25 2187 arteaga sgilbert@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-10-08 gloria smith female 33 2846 anahi jmiller@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-10-09 michael oliver male 25 6621 anderson thomasstephanie@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-09 kathryn valdez female 29 2743 arroyo dulce tinawolf@hotmail.com +univ. nacional del comahue farmacia 2020-10-09 belinda willis female 37 6701 carlos keen goldenryan@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-09 jason haynes male 25 2208 gaboto mullinssean@gmail.com +univ. nacional del comahue arquitectura 2020-10-09 alexandria black female 25 5265 agua los matos billy87@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-10-09 ian morris male 31 1895 arturo segui ygonzales@gmail.com +univ. nacional del comahue diseño industrial 2020-10-09 glen reilly male 32 6214 casimiro gomez vfernandez@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-09 david dudley male 35 5333 banda de lucero youngdavid@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-10 tracy johnson female 31 4709 san jose de piedra blanca michael34@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-10 matthew vaughn male 17 3080 colonia pujol msanchez@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-10-10 crystal ray female 17 7404 fortin lavalle shortangela@yahoo.com +univ. nacional del comahue diseño industrial 2020-10-10 victoria howe female 19 2115 colonia valdez margaretsmith@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia política 2020-10-10 jay holland male 17 7623 campo la plata dustin47@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-10 allison mclaughlin female 33 3587 san antonio de obligado yodermaria@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-10 aaron lyons male 33 2600 boca p 25 mhutchinson@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-10-10 brandi mahoney female 17 1676 santos lugares mark87@gmail.com +univ. nacional del comahue medicina 2020-10-10 kristina welch female 33 7011 aneque grande brownlawrence@hotmail.com +univ. nacional del comahue diseño industrial 2020-10-10 amy bonilla female 31 2347 colonia mackinlay erika40@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-10 jason wilson male 35 9033 aldea apeleg heathergamble@yahoo.com +univ. nacional del comahue arquitectura 2020-10-11 cody hunt male 33 3214 estacion yerua keith37@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-11 anthony fernandez male 17 3463 aristia gregoryhoffman@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-10-11 duane campbell male 27 1647 zona delta san fernando jamesmoore@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-11 james gates male 33 5265 agua los matos christopher21@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-11 wesley harris male 27 5545 agua de diaz douglasmartin@gmail.com +univ. nacional del comahue medicina 2020-10-11 derek wade male 27 2821 arroyo del cura tiffanyperez@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-10-11 destiny garcia female 27 5460 agua de la zorra brandtdavid@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-10-12 chelsea fletcher female 25 2764 campo la nena kmoreno@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-12 chase hicks male 25 7607 balneario atlantida amber24@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-10-12 rachel mills female 35 1980 barrio la dolly andrew99@yahoo.com +univ. nacional del comahue actuario 2020-10-12 jeremy johnson male 19 2340 ceres scottbaxter@gmail.com +univ. nacional del comahue arquitectura 2020-10-12 april thomas female 25 6337 ingeniero thompson erin38@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-10-12 roberta wheeler female 26 4709 san jose de piedra blanca elizabethnichols@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-10-12 caroline thompson female 19 2854 dos hermanas solisamy@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-12 oscar miller male 27 8175 goyena pmann@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-12 jason lewis male 33 9050 gobernador moyano tmcmahon@gmail.com +univ. nacional del comahue farmacia 2020-10-12 alan martinez male 27 1718 san antonio de padua brownjustin@yahoo.com +univ. nacional del comahue actuario 2020-10-12 erin nichols female 39 9207 arroyo guilaia sean31@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-12 julie decker female 31 3194 paso telegrafo robertgoodwin@gmail.com +univ. nacional del comahue licenciatura en administración 2020-10-12 carla wagner female 27 2109 acebal sheena43@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-10-13 cindy adams female 40 2505 campo la riviere lewisduane@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-10-13 kimberly poole female 31 5601 capitan montoya uoconnor@hotmail.com +univ. nacional del comahue bioquímica 2020-10-13 ann smith female 29 3023 cululu wrightwilliam@hotmail.com +univ. 
nacional del comahue contador público 2020-10-13 lisa collier female 27 6634 alberti casestacey@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-13 catherine garcia female 31 7167 carilo ygarcia@gmail.com +univ. nacional del comahue diseño industrial 2020-10-13 jason white male 23 7201 colman birdsara@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-10-13 juan sanchez male 19 1617 el talar aimee12@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-10-13 kyle mata male 25 5609 aristides villanueva garciasean@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-13 jessica graves female 29 6651 ingeniero de madrid rodriguezwilliam@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-13 eric wilson male 17 3541 campo las puertas jeffreymontgomery@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-13 sandra jones female 37 3316 arroyo pastora morrismichael@gmail.com +univ. nacional del comahue bioquímica 2020-10-13 brandon jones male 39 2845 colonia duportal mjackson@gmail.com +univ. nacional del comahue contador público 2020-10-13 terry rodriguez male 35 6007 arribeños lisajohnston@yahoo.com +univ. nacional del comahue medicina 2020-10-13 susan wolf female 37 5615 25 de mayo cross@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-10-13 jeffrey campbell male 35 3337 adolfo j pomar paulcarroll@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-10-14 paula scott female 19 2173 campo pesoa nicholas30@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-10-14 misty murphy female 17 9411 base aerea teniente matienzo bradleyalexander@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-14 diane black female 25 4231 albigasta williamrice@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias geológicas 2020-10-14 brianna williams female 40 4601 corral de piedras davidmiller@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-14 marissa martinez female 37 1885 guillermo e hudson lisaneal@hotmail.com +univ. nacional del comahue agronomía 2020-10-14 jonathon wilson male 37 3501 campo de galnasi kkennedy@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-14 steve bender male 35 4235 albigasta lrogers@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-14 barbara spears female 21 6433 arturo vatteone cindy96@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-14 connie duncan female 37 5584 barrio villa adela pparsons@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-14 melissa browning female 23 2709 los indios michelle02@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-15 nicole williams female 37 5735 colonia bella vista pamelasoto@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-15 natalie schaefer female 35 1776 9 de abril grace96@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-15 alyssa lam female 21 5881 cañada la negra antonio84@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-15 elizabeth harris female 19 1847 rafael calzada mcarr@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-15 matthew barton male 29 5587 barcala ryanharper@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-15 christopher lee male 37 8174 arroyo aguas blancas farmerjohnny@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-15 julie warren female 29 9050 gobernador moyano alejandro81@gmail.com +univ. 
nacional del comahue farmacia 2020-10-15 stacey garcia female 21 3220 arroyo manganga jane46@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-10-15 richard fields male 29 7607 balneario atlantida orozcojohn@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-15 dustin frey male 27 3269 arroyo baru danielleharmon@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-15 wendy reyes female 18 6058 pazos kanki kellybrittany@gmail.com +univ. nacional del comahue contador público 2020-10-16 courtney pace female 23 8101 calderon jellis@hotmail.com +univ. nacional del comahue diseño industrial 2020-10-16 frederick fletcher male 19 7220 funke matthew01@gmail.com +univ. nacional del comahue contador público 2020-10-16 tracy weeks female 19 1676 santos lugares robertrocha@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-16 mark powell male 35 4122 alizal kirsten42@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-16 david ford male 39 3371 cabure angelamora@hotmail.com +univ. nacional del comahue actuario 2020-10-16 john wilson male 31 3052 cañadita john88@yahoo.com +univ. nacional del comahue diseño industrial 2020-10-16 nicholas harris male 35 8403 alicura spencerjose@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-16 kathy rojas female 35 4146 barrio belgrano pluna@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-10-16 trevor franklin male 37 7263 el chumbeau danielhines@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-16 joanne lewis female 35 4606 colonia los lapachos vcarney@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-16 jeremy petersen male 21 5276 baldes de pacheco tammy85@hotmail.com +univ. 
nacional del comahue diseño de imagen y sonido 2020-10-17 doris davis female 33 3532 curandu daniellejohnson@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-17 andrew smith male 35 3136 alcaraz norte kcoleman@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-17 melissa young female 31 6616 castilla rebecca05@hotmail.com +univ. nacional del comahue medicina 2020-10-17 joe horne male 37 1682 martin coronado robertbennett@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-10-17 susan maldonado female 22 5400 desamparados ashley87@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-17 courtney brennan female 23 3199 los laureles rosesharp@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-17 anthony thompson male 35 6530 carlos casares nicholasgill@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-17 martha johnson female 37 3366 almirante brown luis60@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-17 april roth female 27 6411 bravo del dos susan58@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-10-17 nichole reyes female 39 6311 campo de los toros bethanystanley@gmail.com +univ. nacional del comahue bioquímica 2020-10-17 jonathan baird male 35 3066 campo garay gloriaarroyo@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-10-17 carol nelson female 35 3332 capiovi brandtjason@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-17 tracy wells female 40 8203 la chirlandia thompsonbradley@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-17 john johnson male 23 7265 cazon howeheather@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-10-17 derek warren male 29 3531 colonia aborigen umoore@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias biológicas 2020-10-18 nicole whitaker female 31 7112 aguas verdes kcarter@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-10-18 karen king female 33 6018 colonia los bosques sarah48@gmail.com +univ. nacional del comahue contador público 2020-10-18 christopher martinez male 29 6513 colonia las yescas michael37@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-18 heather terrell female 33 6239 gonzalez moreno xreed@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-10-18 ricky garcia male 38 6070 balsa dball@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-18 heather martinez female 33 8336 gobernador duval bgarcia@gmail.com +univ. nacional del comahue medicina 2020-10-18 samantha bernard female 39 1815 escuela agricola don bosco heatherlee@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-18 hector reyes male 33 5591 alpatacal rmartinez@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-18 timothy gibson male 35 6050 cuartel vii christopherevans@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-18 allen ramirez male 19 4168 agua blanca sullivanryan@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-18 joseph mata male 19 6305 atreuco zbartlett@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-18 sarah shaffer female 17 1636 la lucila melanie86@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-18 john lee male 29 4147 alto las lechuzas saundersamy@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-10-19 julia smith female 17 2806 las palmas james31@hotmail.com +univ. 
nacional del comahue arquitectura 2020-10-19 angela mullins female 29 2103 colonia escribano kentjill@gmail.com +univ. nacional del comahue arquitectura 2020-10-19 peter spencer male 21 6001 agustin roca donnavaldez@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-10-19 stephanie benjamin female 28 1744 cuartel v agoodman@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-19 matthew hughes male 25 6665 ernestina mcguirelaura@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-19 sonia sanders female 29 7408 la colina christopher59@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-19 thomas dean male 23 1774 la salada fsmith@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-19 stephen gonzalez male 23 5636 favelli qmora@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-19 michael luna male 23 8117 alferez san martin james83@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-10-19 timothy wood male 25 4101 agua negra maldonadomichael@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-10-19 charles taylor male 27 4242 25 de mayo renee64@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-19 cassandra serrano female 29 8000 adela corti aaronlove@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-20 christopher norman male 25 3326 colonia leiva millertimothy@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-20 brenda gamble female 21 4134 acheral angel72@gmail.com +univ. nacional del comahue ingeniería en informática 2020-10-20 philip wang male 19 8416 anecon grande liukathryn@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-10-20 autumn mcgee female 39 8133 la rosa fdoyle@hotmail.com +univ. 
nacional del comahue técnico para bioterios 2020-10-20 daniel glenn male 34 3586 campo yaguarete pjohnson@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-20 benjamin lopez male 25 1686 hurlingham johnsonrebecca@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-20 kaitlyn strong female 35 4147 alto las lechuzas tnichols@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-10-20 joel dorsey male 39 5595 cupiles christopher37@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-20 theresa scott female 19 1872 sarandi mirandalarson@yahoo.com +univ. nacional del comahue medicina 2020-10-20 colleen rodriguez female 39 6070 balsa wadecheryl@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-10-20 christina nelson female 33 8134 argerich fbennett@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-20 bryan copeland male 33 6605 campo peña lopez jsnyder@gmail.com +univ. nacional del comahue arquitectura 2020-10-20 melinda walter female 29 8111 arroyo pareja bushbrett@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-10-21 jose navarro male 35 4633 san pedro de iruya fweaver@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-21 tammy gibson female 31 6417 casbas john91@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-10-21 kevin perez male 26 4137 abra baya rasmussenluis@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-10-21 joshua patterson male 17 7208 coronel boerr baileyrose@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-21 kayla hall female 36 4705 aguadita jack59@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-21 michael chase male 22 6075 arenaza milleraaron@yahoo.com +univ. 
nacional del comahue licenciatura en ciencia política 2020-10-21 michele mooney female 23 3586 campo yaguarete michaelleon@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-21 sierra kaiser female 39 2508 armstrong sarah66@yahoo.com +univ. nacional del comahue farmacia 2020-10-21 mary perez female 17 2745 gahan mzimmerman@gmail.com +univ. nacional del comahue bioquímica 2020-10-21 robert mendoza male 25 8373 alianza castanedadalton@yahoo.com +univ. nacional del comahue bioquímica 2020-10-21 kelly bauer female 29 3265 arroyo caraballo ccoleman@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-21 jacqueline ingram female 35 5529 colonia bombal joseph84@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-22 amanda williams female 25 1735 el durazno eadams@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-10-22 christopher palmer male 27 1911 bme bavio gral mansilla sarah42@gmail.com +univ. nacional del comahue diseño industrial 2020-10-22 natalie lowe female 27 6277 buena esperanza ann54@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-22 benjamin lee male 29 8172 arroyo corto ecox@hotmail.com +univ. nacional del comahue medicina 2020-10-22 emily baker female 25 5365 el jumeal robert98@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-10-22 spencer christian male 32 2743 arroyo dulce steven06@hotmail.com +univ. nacional del comahue contador público 2020-10-22 jason mays male 21 2204 jesus maria mcneildaniel@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-22 deborah woods female 31 2705 haras san jacinto littleshannon@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-10-22 jackie garrett female 19 3056 campo coubert ashley35@yahoo.com +univ. 
nacional del comahue licenciatura en ciencias ambientales 2020-10-22 mike johnson male 35 3337 adolfo j pomar colejamie@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-22 vanessa walton female 27 9310 aguada alegre kholloway@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-22 victoria dixon female 22 7517 juan e barra john81@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-10-22 alexis thompson female 39 2200 las quintas kenglish@gmail.com +univ. nacional del comahue técnico para bioterios 2020-10-23 gabriel dawson male 37 7212 doctor domingo harosteguy richardwilliams@gmail.com +univ. nacional del comahue agronomía 2020-10-23 parker shaw male 31 6652 olascoaga johnsonpatricia@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-23 sean zimmerman male 39 4184 bustamante cynthia55@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-23 justin mcmillan male 29 4242 25 de mayo njimenez@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-23 matthew stephenson male 21 3020 campo santo domingo tanner43@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-23 jeremy blackburn male 19 5303 anjullon blake46@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-23 raymond morris male 19 7637 la dulce daviskari@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-23 laura gibson female 17 3087 felicia carmenmckinney@yahoo.com +univ. nacional del comahue actuario 2020-10-23 debra scott female 17 6389 alegria hsampson@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-23 lawrence stanley male 31 7531 despeñaderos ryan81@yahoo.com +univ. nacional del comahue arquitectura 2020-10-23 patrick gray male 25 2403 bauer y sigel rebekah02@gmail.com +univ. 
nacional del comahue licenciatura en sociología 2020-10-23 david singh male 37 3516 basail fbaker@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-10-23 david erickson male 17 2814 alto los cardales caseyburgess@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-24 cynthia rodgers female 33 3386 caraguatay johnsonjason@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-24 kendra adams female 35 2713 manuel ocampo nathaniel92@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-10-24 ryan fitzgerald male 23 5357 el horno fowlermorgan@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-24 troy mejia male 25 2144 campo horquesco coffeylatoya@gmail.com +univ. nacional del comahue contador público 2020-10-24 james anderson male 27 5600 agua de la mula hrivera@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-10-24 christine blackburn female 31 4504 23 de agosto zjennings@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-10-24 brett castillo male 22 6551 juan f ibarra mollybaker@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-10-24 spencer campbell male 23 5596 12 de octubre april21@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-10-24 justin salinas male 25 3005 colonia california patricia51@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-10-24 sarah williams female 39 2728 melincue williamreed@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-10-24 patty perez female 29 1895 arturo segui mmoore@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-25 kevin drake male 29 3543 colonia lote 12 orobinson@hotmail.com +univ. nacional del comahue medicina 2020-10-25 brett ferguson male 28 3300 arroyo mmckenzie@gmail.com +univ. 
nacional del comahue arquitectura 2020-10-25 sarah lowe female 37 1886 ranelagh jamesthompson@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-25 michael ortiz male 29 3448 alamo wbowman@hotmail.com +univ. nacional del comahue actuario 2020-10-25 shannon weber female 39 2635 cañada del ucle ashleymcgee@yahoo.com +univ. nacional del comahue diseño industrial 2020-10-25 james leblanc male 39 6476 chiclana carrollstephen@yahoo.com +univ. nacional del comahue medicina 2020-10-25 christine bradford female 29 2111 francisco paz loganpatrick@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-25 mary waters female 17 8322 cutral co bdominguez@yahoo.com +univ. nacional del comahue agronomía 2020-10-25 paul petty male 23 5405 agua y energia carrillohenry@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-25 scott sharp male 23 4133 la banda morganwhitney@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-25 megan wilson female 37 7513 adolfo gonzales chaves woodstephanie@yahoo.com +univ. nacional del comahue contador público 2020-10-25 allison miller female 37 8181 azopardo aalvarez@gmail.com +univ. nacional del comahue arquitectura 2020-10-25 andrea hardin female 31 5637 30 de octubre dbrown@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-10-25 denise gray female 27 2754 campo crisol reedjonathan@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-10-25 veronica torres female 23 9200 arroyo pescado john69@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-25 ethan hopkins male 37 3009 el tropezon bradshawshannon@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-25 joseph johnson male 38 3137 alcaraz sud danielreynolds@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias de la computación 2020-10-25 molly clark female 37 8126 aldea san andres christopher24@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-10-25 melvin anthony male 23 7240 kilometro 112 keyanna@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-25 nicole jones female 37 8204 bernasconi deanmichelle@yahoo.com +univ. nacional del comahue actuario 2020-10-26 michele beck female 29 6608 agote veronicabaker@gmail.com +univ. nacional del comahue arquitectura 2020-10-26 meredith fisher female 33 9111 bahia bustamante lgriffith@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-26 linda bradley female 27 3400 bañado norte kathleenmiller@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-26 selena mays female 23 6105 cañada seca zjames@gmail.com +univ. nacional del comahue farmacia 2020-10-26 jason king male 23 2445 cristolia adam27@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-10-26 debra todd female 21 6509 del valle gregorybeck@hotmail.com +univ. nacional del comahue medicina 2020-10-26 lisa thompson female 37 4135 caspinchango figueroaerica@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-10-26 colton barrett male 17 5431 apeadero guanacache zhudson@yahoo.com +univ. nacional del comahue diseño industrial 2020-10-26 megan palmer female 22 8200 colonia lia y allende josephrobinson@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-10-26 ellen jacobs female 33 3581 campo redondo peggy98@yahoo.com +univ. nacional del comahue arquitectura 2020-10-26 diane jones female 27 3162 aranguren carlblack@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-26 derek jones male 25 5517 cespedes emilymccullough@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias geológicas 2020-10-27 kimberly guzman female 38 6346 pellegrini vmcknight@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-10-27 laura harris female 25 5275 agua colorada woodlarry@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-27 corey rhodes male 34 6051 ingeniero balbin lopezsusan@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-27 robert cameron male 25 2156 arsenal de guerra san lorenzo deniseelliott@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-10-27 robert bailey male 33 5300 amilgancho ymitchell@gmail.com +univ. nacional del comahue licenciatura en artes 2020-10-27 daniel rodgers male 39 6065 blaquier chenson@hotmail.com +univ. nacional del comahue contador público 2020-10-27 donald harrell male 25 8353 aguada chacay co moorecarlos@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-27 rebecca bass female 35 2722 wheelwright melissasmith@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-10-27 john armstrong male 29 2400 villani jennifer88@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-27 charles york male 39 3009 el tropezon michellewoods@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-10-28 victoria bradley female 33 1834 temperley ambersmith@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-10-28 jessica cox female 21 2930 la buana moza frankdavid@hotmail.com +univ. nacional del comahue medicina 2020-10-28 susan ayers female 37 3378 22 de diciembre zmarks@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-28 michael palmer male 19 3374 el porvenir anneflores@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-28 david diaz male 23 3170 alberto gerchunoff rhonda46@yahoo.com +univ. 
nacional del comahue técnico para bioterios 2020-10-28 angelica gomez female 17 7150 ayacucho mary97@yahoo.com +univ. nacional del comahue medicina 2020-10-28 sydney jones female 39 4146 barrio belgrano autumn85@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-28 timothy rogers male 23 3187 atencio ccunningham@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-10-28 william mcbride male 23 2720 colon shepardcaleb@yahoo.com +univ. nacional del comahue medicina 2020-10-28 michele gilbert female 39 2635 cañada del ucle vlogan@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-29 philip nguyen male 23 3470 arroyo grande christine03@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-29 rachel gonzalez female 23 3133 arroyo burgos daniel74@gmail.com +univ. nacional del comahue bioquímica 2020-10-29 douglas castro male 33 6605 campo peña lopez omurphy@yahoo.com +univ. nacional del comahue agronomía 2020-10-29 marcus evans male 37 5609 aristides villanueva campostiffany@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-29 laura frey female 31 6607 anasagasti scott46@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-10-29 phillip smith male 29 1778 ciudad evita kjones@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-29 gerald miller male 31 6315 colonia baron jacobsthomas@gmail.com +univ. nacional del comahue agronomía 2020-10-29 james torres male 40 9019 aguada escondida vjarvis@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-10-29 justin adams male 31 3526 gandolfi todd55@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-29 christopher gaines male 33 2740 almacen la colina brittanymontgomery@gmail.com +univ. 
nacional del comahue técnico para bioterios 2020-10-29 peter ramos male 19 7517 juan e barra xortega@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-10-29 aaron sims male 38 5276 baldes de pacheco msmith@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-10-29 dan perez male 37 7000 cantera aguirre jessicavasquez@yahoo.com +univ. nacional del comahue farmacia 2020-10-29 chloe lambert female 35 5421 la tranca katherine72@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-10-29 beth gray female 25 3113 colonia celina sonya51@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-10-30 darlene baxter female 31 4139 agua amarilla la hoyada robertclark@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-30 dawn anderson female 37 6605 campo peña lopez perezmichael@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-10-30 gina ruiz female 23 5591 alpatacal andersondanielle@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-10-30 rebecca henderson female 31 1644 victoria fmason@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-10-30 brett garcia male 23 2813 arroyo de la cruz clarknichole@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-10-30 jenna diaz female 25 9000 comodoro rivadavia nburns@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-10-30 jill gardner female 19 2443 colonia margarita jasonchristensen@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-10-30 angela perkins female 37 5507 baños lunlunta gmaldonado@yahoo.com +univ. nacional del comahue contador público 2020-10-31 amanda hill female 32 8129 17 de agosto tyler57@hotmail.com +univ. 
nacional del comahue ciencias veterinarias 2020-10-31 erik mcdaniel male 31 3016 san jose kimberlycontreras@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-10-31 chelsea simpson female 21 2241 larrechea rwood@yahoo.com +univ. nacional del comahue medicina 2020-10-31 mark middleton male 37 5713 balde ahumada rhodeselizabeth@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-10-31 deborah bishop female 23 3232 cabred qalvarez@yahoo.com +univ. nacional del comahue medicina 2020-10-31 zachary jordan male 31 1742 paso del rey jacqueline73@hotmail.com +univ. nacional del comahue agronomía 2020-10-31 bridget james female 24 4624 abra mayo harrisonrandall@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-10-31 timothy costa male 23 5384 punta de los llanos zhernandez@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-10-31 nicholas flores male 19 8500 el dique jason54@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-10-31 anna davis female 31 3194 paso telegrafo deborah18@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-10-31 christopher wright male 37 6471 atahualpa teresasmith@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-01 raymond craig male 25 5707 aguaditas sarah15@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-11-01 victoria harper female 37 3463 aristia april98@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-01 cory davis male 19 3730 cabral jamie28@yahoo.com +univ. nacional del comahue medicina 2020-11-01 megan smith female 40 7201 colman corey28@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-01 samantha harper female 17 1765 isidro casanova asmith@hotmail.com +univ. 
nacional del comahue arquitectura 2020-11-01 marissa gomez female 39 2718 lierra adjemiro jasminemorrison@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-11-02 nancy warren female 31 2347 colonia mackinlay ncook@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-02 sean weiss male 39 2916 el jupiter danarodriguez@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-02 jared farley male 31 7511 balneario oceano ujohnson@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-02 andrew berg male 18 3048 angeloni charlesgarcia@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-02 darryl freeman male 31 9011 bahia langara lynchdenise@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-02 william morgan male 35 8146 el rincon millsdustin@hotmail.com +univ. nacional del comahue medicina 2020-11-02 taylor harmon female 19 3322 aparicio cue peter57@hotmail.com +univ. nacional del comahue agronomía 2020-11-02 ashley mckinney female 18 3338 17 de agosto kdaniels@gmail.com +univ. nacional del comahue actuario 2020-11-02 alexander durham male 27 2352 ambrosetti alan12@hotmail.com +univ. nacional del comahue farmacia 2020-11-02 carl thomas male 36 3700 barrio gral jose de san martin otate@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-11-02 scott young male 17 9013 cañadon seco steven97@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-03 joseph fischer male 17 6360 barrio el molino raymond31@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-03 alejandra williams female 21 1842 el jaguel adam54@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-03 andrew walker male 17 9315 bajo caracoles diana62@yahoo.com +univ. 
nacional del comahue bioquímica 2020-11-03 robert scott male 29 6233 condarco jduke@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-03 corey mccoy male 31 4178 abra rica dmiller@gmail.com +univ. nacional del comahue medicina 2020-11-03 brandy patterson female 21 3414 abra simpsonchristopher@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-03 brent thomas male 21 2824 britos nancymiller@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-03 lori young female 25 9050 gobernador moyano egarza@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-03 david golden male 33 1804 canning lfoster@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-03 taylor foley female 31 3470 arroyo grande andrewcox@hotmail.com +univ. nacional del comahue contador público 2020-11-03 emily rhodes female 27 8200 colonia lia y allende nicole72@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-03 stephen brown male 27 1712 castelar jennifer93@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-03 daniel ford male 19 6746 cucha cucha justin96@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-11-03 madison bailey female 37 5735 colonia bella vista shelly85@hotmail.com +univ. nacional del comahue agronomía 2020-11-04 kathy mills female 37 5365 el jumeal obuckley@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-04 amy robinson female 35 6326 anguil sheila53@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-04 kelly glenn female 23 2147 san genaro norte michaelrobinson@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-11-04 arthur rodriguez male 36 2105 cañada rica pamelagarcia@hotmail.com +univ. 
nacional del comahue licenciatura en sociología 2020-11-04 darrell robinson male 27 3016 san jose jamesschneider@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-04 rebecca williams female 35 5383 agua colorada anthonybrown@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-04 erica poole female 25 7313 16 de julio johnsonkenneth@gmail.com +univ. nacional del comahue bioquímica 2020-11-04 gina bright female 35 2751 almacen castro zoechambers@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-04 roger ferrell male 31 5573 colonia delfino wgallegos@gmail.com +univ. nacional del comahue ingeniería en informática 2020-11-04 joan baldwin female 19 6725 carmen de areco freyes@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-04 ruben king male 21 4163 huasa pampa norte jordanterry@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-04 thomas bennett male 27 8324 cipolletti tara84@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-04 joshua brown male 36 8132 balneario chapalco fjones@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-04 jamie porter female 27 3425 costa grande brandon55@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-04 amy hoover female 37 3248 caraguata hobbssabrina@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-04 kirk rios male 29 3350 apostoles kvaughn@hotmail.com +univ. nacional del comahue actuario 2020-11-04 michelle long female 29 5881 cañada la negra bowmanbrenda@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-05 richard flores male 28 2342 campo el mataco gjohnson@yahoo.com +univ. 
nacional del comahue licenciatura en sociología 2020-11-05 nancy rodriguez female 27 4650 abra de peñas christinebarrett@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-11-05 anthony morris male 39 3144 alcaraz 1ro nathanwaller@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-05 rachel abbott female 33 3222 buen retiro barnesjustin@gmail.com +univ. nacional del comahue bioquímica 2020-11-05 robert garcia male 37 5511 general gutierrez spencerthomas@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-11-05 dennis freeman male 17 7305 antonio de los heros christopherramirez@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-05 christopher smith male 39 5306 carrizal mirandawalker@gmail.com +univ. nacional del comahue bioquímica 2020-11-05 bethany walton female 39 1657 11 de septiembre carla96@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-05 bethany wolfe female 19 4713 ocho vados kimberlyelliott@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-05 joshua boyd male 27 6634 alberti gerald01@hotmail.com +univ. nacional del comahue diseño industrial 2020-11-05 joshua stokes male 37 5701 11 de mayo jennifer73@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-05 wanda downs female 37 1613 los polvorines eharris@gmail.com +univ. nacional del comahue farmacia 2020-11-05 thomas moore male 29 8341 arroyo quillen stephaniebarron@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-05 james golden male 35 5569 aguada kevinhess@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-06 robert hicks male 27 8521 arroyo de la ventana thall@yahoo.com +univ. nacional del comahue contador público 2020-11-06 kristen davis female 19 7226 gorchs anthonyjohnson@yahoo.com +univ. 
nacional del comahue técnico para bioterios 2020-11-06 richard smith male 21 1682 martin coronado annamartinez@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-06 joe davis male 17 3229 colonia freitas carlaroberts@hotmail.com +univ. nacional del comahue medicina 2020-11-06 veronica flores female 27 5751 agua salada lisacollins@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-06 casey murphy male 37 3206 bella union paraje stephanie85@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-11-06 carlos garza male 33 3216 arroyo hondo hayneslarry@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-06 matthew thomas male 28 5325 alpasinche jglass@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-06 margaret holt female 37 5615 25 de mayo garzaheather@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-06 lisa kaiser female 19 4741 agua de las palomas kennethflores@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-06 allen turner male 27 6628 colonia zambungo sethbrennan@gmail.com +univ. nacional del comahue agronomía 2020-11-07 michael young male 29 6203 el olivo kgillespie@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-07 thomas lopez male 23 2240 campo garcia patriciafisher@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-07 alyssa garza female 29 3450 8 de diciembre markballard@yahoo.com +univ. nacional del comahue medicina 2020-11-07 alicia ross female 37 3425 costa grande daniel83@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-11-07 manuel king male 35 4230 brea chimpana michelleperry@gmail.com +univ. nacional del comahue licenciatura en administración 2020-11-07 linda christensen female 24 3703 aleloy michellelambert@yahoo.com +univ. 
nacional del comahue arquitectura 2020-11-07 lori barrett female 35 9003 bahia solano briggsjeffery@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-07 rebecca olson female 29 3589 kilometro 23 kimberly98@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-07 kyle harvey male 24 7630 hospital necochea villanuevajustin@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-07 natalie williams female 33 7507 el bombero pbuck@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-07 michele rodriguez female 37 6009 san marcelo andradejeff@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-07 beth brown female 25 2520 la california vjohnson@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-08 michele cuevas female 35 3405 algarrobal puisoye sweeneyrobert@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-08 alicia ruiz female 21 8308 villa manzano sandra43@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-08 thomas fletcher male 33 1826 remedios de escalada matthew98@gmail.com +univ. nacional del comahue contador público 2020-11-08 teresa smith female 18 8532 arroyo salado jeffrey58@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-08 nicholas matthews male 21 2000 villa angelica michaelarellano@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-08 christopher graves male 21 1852 burzaco keith86@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-08 michael davis male 23 2813 arroyo de la cruz taylorprice@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-08 jennifer livingston female 23 9053 aguada grande charles64@hotmail.com +univ. 
nacional del comahue licenciatura en administración 2020-11-09 kimberly harris female 27 5621 agua de torre wbrown@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-11-09 kristine coleman female 27 3412 albardon danacole@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-09 christine fowler female 31 3203 arroyo grande saraday@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-11-09 jerry velez male 28 3188 colonia falco gonzalezjeffery@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-11-09 christina smith female 37 2828 colonia nueva montevideo stephanie41@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-09 christopher rodriguez male 23 6352 colonia la india ljones@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-09 michael smith male 21 1889 bosques melaniebradley@hotmail.com +univ. nacional del comahue bioquímica 2020-11-09 melinda gordon female 32 3344 2 de julio richardlozano@hotmail.com +univ. nacional del comahue actuario 2020-11-09 shelby pennington female 35 6703 alastuey christopher83@hotmail.com +univ. nacional del comahue arquitectura 2020-11-09 heather wilson female 17 6734 rawson bbrown@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-11-09 lisa bonilla female 31 4631 antiguo allenwilliam@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-11-10 richard banks male 23 5735 colonia bella vista wbaker@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-10 jeffrey martinez male 27 5577 el alto mariaross@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-10 sherry williams female 27 5427 apeadero quiroga mackthomas@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-10 jose riley male 33 5557 caracoles hparker@gmail.com +univ. 
nacional del comahue licenciatura en musicoterapia 2020-11-10 alfred clark male 31 3448 alamo ekhan@hotmail.com +univ. nacional del comahue medicina 2020-11-10 stacy martinez female 37 1617 el talar david65@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-10 cindy ryan female 33 6031 de bruyn millererika@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-10 connor gregory male 27 3222 buen retiro angela79@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-10 bianca kent female 21 3733 campo el jacaranda gwalls@gmail.com +univ. nacional del comahue licenciatura en administración 2020-11-10 michelle smith female 33 6101 villa saboya smithanna@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-10 brandon mack male 31 5329 amuschina knightjeffrey@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-10 michelle bass female 23 6557 arboleda robert67@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-10 michael boyd male 21 2173 campo pesoa emilychapman@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-10 gary harper male 35 2255 campo rodriguez ccampbell@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-11-11 steven evans male 27 8166 saldungaray armstrongbrandon@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-11 jennifer mclean female 27 1702 ciudadela markanderson@yahoo.com +univ. nacional del comahue farmacia 2020-11-11 andrew williams male 31 4640 abra pampa samanthamiller@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-11 kyle allen male 21 6474 campo aristimuño christopher88@hotmail.com +univ. nacional del comahue agronomía 2020-11-11 lance ward male 17 3448 alamo natalie49@gmail.com +univ. 
nacional del comahue técnico para bioterios 2020-11-11 ryan berry male 33 9107 28 de julio robertsmith@gmail.com +univ. nacional del comahue actuario 2020-11-11 susan patterson female 23 2349 colonia dos rosas y la legua turneralicia@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-11-12 michael arellano male 31 3309 arroyo tomas reidkayla@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-12 madison brennan female 33 3100 avenida ejercito parana christophersmith@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-11-12 michelle harris female 33 8187 bordenave david24@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-11-12 michael oliver male 17 3592 colonia hardy bbush@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-12 darin perez male 21 3575 arroyo ceibal allisonking@gmail.com +univ. nacional del comahue licenciatura en artes 2020-11-12 joseph thomas male 19 3132 el pingo williamsmary@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-12 cynthia clark female 35 3400 bañado norte kclark@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-12 gordon hunter male 27 2915 aguirrezabala collinswendy@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-12 renee day female 40 9001 cañadon ferrais wblack@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-12 amy frank female 25 2944 rio tala qcook@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-11-12 ryan espinoza male 37 3016 san jose torreschristina@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-11-12 tabitha garcia female 29 3081 cavour lmcdonald@hotmail.com +univ. nacional del comahue agronomía 2020-11-12 brenda king female 21 2324 colonia tacurales jonathan60@gmail.com +univ. 
nacional del comahue ciencias veterinarias 2020-11-12 michelle roberts female 21 9207 arroyo guilaia martinjames@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-13 patrick allen male 17 5585 el cipres gscott@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-13 melissa krueger female 19 2943 ireneo portela johnhogan@yahoo.com +univ. nacional del comahue farmacia 2020-11-13 michael jacobs male 25 2248 bernardo de irigoyen brian58@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-13 ashley green female 25 2527 colonia san francisco christian68@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-13 dorothy ward female 19 4151 bajo de los sueldos harperchristine@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-13 corey arroyo male 35 4101 agua negra fsmith@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-13 joseph yang male 31 6339 cailomuta rossraymond@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-13 vickie davis female 33 6438 masurel hartjulie@gmail.com +univ. nacional del comahue bioquímica 2020-11-13 jesse kent male 19 1884 berazategui hansonmaria@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-13 janet white female 23 4111 aguada qgibson@yahoo.com +univ. nacional del comahue contador público 2020-11-13 nicole murray female 20 7612 camet cadams@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-13 joseph larsen male 28 2170 candelaria sud marymartinez@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-13 nancy hughes female 23 5442 ambas puntillas evancooper@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-13 lacey lawrence female 31 8534 aguada cecilio nguyenbrenda@yahoo.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-11-13 jessica delacruz female 21 2322 cabaña el cisne martinhunt@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-13 adam moore male 29 1665 jose clemente paz brandon66@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-13 rodney thompson male 30 3453 ifran urobertson@hotmail.com +univ. nacional del comahue diseño industrial 2020-11-13 david johnson male 35 7535 pontaut eric52@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-11-13 nancy colon female 35 2303 angelica nicole14@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-14 david todd male 33 2407 campo clucellas shawn12@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-14 theresa joseph female 33 3100 avenida ejercito parana rodriguezrhonda@yahoo.com +univ. nacional del comahue farmacia 2020-11-14 jacob hodges male 27 9400 an aike robert74@gmail.com +univ. nacional del comahue contador público 2020-11-14 debra taylor female 39 6228 aguas buenas cburgess@hotmail.com +univ. nacional del comahue contador público 2020-11-14 ann edwards female 33 6383 campo moises seccion 1a walkerpeter@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-14 sonia foster female 23 6000 barrio carosio youngjeffery@gmail.com +univ. nacional del comahue licenciatura en administración 2020-11-14 rebecca johnson female 20 6723 cucullu david74@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-14 wesley murray male 31 6000 barrio carosio wpace@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-14 megan nelson female 23 2635 cañada del ucle jason60@yahoo.com +univ. nacional del comahue agronomía 2020-11-14 scott barry male 29 6614 franklin vmartin@yahoo.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-11-15 brittany adams female 21 8307 colonia gobernador ayala clairebutler@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-15 zachary pacheco male 38 3466 abalo zhardy@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-15 beth stewart female 31 2529 piamonte fgregory@hotmail.com +univ. nacional del comahue actuario 2020-11-15 julia mcgee female 29 8305 aguada san roque millerrhonda@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-15 glenn burns male 21 3144 alcaraz 1ro umartinez@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-11-15 elizabeth rodriguez female 33 2942 baradero tiffanymoses@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-15 robert young male 33 2349 colonia dos rosas y la legua troy50@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-15 jasmine stein female 27 2405 colonia cello jhester@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-15 kara adams female 39 5473 aguayo lisa26@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-16 richard jacobs male 21 1911 bme bavio gral mansilla jennifer18@yahoo.com +univ. nacional del comahue bioquímica 2020-11-16 elizabeth wang female 35 6213 lote 11 escuela 107 jaime22@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-16 amy powell female 31 2852 alarcon bethwalker@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-16 michael baxter male 19 5584 barrio villa adela gregory78@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-16 stacey spears female 27 7009 iraola robert87@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-16 daniel cobb male 25 6434 palantelen salvarado@gmail.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-11-16 ashley mack female 33 3357 barra bonita watersmelissa@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-16 tracy johnson female 17 8336 gobernador duval rebecca95@gmail.com +univ. nacional del comahue licenciatura en administración 2020-11-16 james parker male 31 1702 ciudadela jessica21@hotmail.com +univ. nacional del comahue contador público 2020-11-16 ashley diaz female 23 8431 el hoyo brianfitzgerald@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-11-17 adriana hernandez female 31 5345 baños termales kimberlymiller@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-11-17 jason ford male 21 5460 agua de la zorra joneskevin@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-17 jonathan brown male 19 7108 costa del este laurie15@gmail.com +univ. nacional del comahue medicina 2020-11-17 abigail caldwell female 37 2700 barrio trocha markgrant@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-17 timothy payne male 39 9201 cachel vanessagarcia@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-17 michael kim male 17 3722 2 de mayo nschroeder@yahoo.com +univ. nacional del comahue arquitectura 2020-11-17 shelly gentry female 19 9011 bahia langara nathangarcia@gmail.com +univ. nacional del comahue diseño industrial 2020-11-17 jennifer dunn female 29 6407 girodias john08@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-17 rebecca velazquez female 29 5759 calera argentina meganlloyd@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-11-18 paul livingston male 19 9041 los antiguos lgarcia@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-11-18 james travis male 17 6385 arata palmermatthew@gmail.com +univ. 
nacional del comahue licenciatura en sociología 2020-11-18 tyler odom male 33 3474 chavarria ncarter@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-18 christopher sandoval male 19 6660 25 de mayo kyle46@gmail.com +univ. nacional del comahue actuario 2020-11-18 john thompson male 39 5465 baños pismanta fletcherkyle@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-18 chad jordan male 31 3226 buena vista kathy90@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-18 timothy winters male 33 7511 balneario oceano brockmark@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-19 jennifer wilson female 27 2415 desvio boero kelly65@hotmail.com +univ. nacional del comahue medicina 2020-11-19 theresa anderson female 29 6003 ascencion agreene@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-11-19 harold mason male 37 1925 destileria fiscal deanthomas@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-19 rachael ramirez female 33 6463 alagon jerry93@gmail.com +univ. nacional del comahue licenciatura en artes 2020-11-19 jordan anderson female 18 7249 el araza gberry@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-19 sandra hernandez female 29 3485 carandaiti lijacob@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-19 cynthia castillo female 17 2111 francisco paz shaffertravis@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-19 pamela benjamin female 33 1651 san andres adriana75@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-19 cynthia holloway female 23 5343 lavalle blaircaleb@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-19 sharon adams female 19 5773 cañada amanda92@hotmail.com +univ. 
nacional del comahue ingeniería en informática 2020-11-19 melissa robertson female 29 7630 hospital necochea josephking@gmail.com +univ. nacional del comahue técnico para bioterios 2020-11-19 dorothy garner female 17 9039 hito 45 daniel36@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-19 harry warren male 27 7303 altona malik20@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-11-19 william hodges male 25 3174 altamirano sud james78@yahoo.com +univ. nacional del comahue medicina 2020-11-19 dustin boyd male 39 2146 clason cherylschmidt@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-20 michelle harris female 33 7261 saladillo norte martinezjohn@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-20 debra kirk female 19 5555 puente del inca tdavis@hotmail.com +univ. nacional del comahue agronomía 2020-11-20 sheri ross female 17 4750 agua colorada millerana@hotmail.com +univ. nacional del comahue actuario 2020-11-20 daniel klein male 19 5327 capihuas jdavis@gmail.com +univ. nacional del comahue actuario 2020-11-20 robin hughes female 37 5632 colonia alvear thorntonjames@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-20 david morales male 31 2846 anahi frobinson@gmail.com +univ. nacional del comahue farmacia 2020-11-20 james reed male 24 3641 arroyo seco ebarrett@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-11-20 richard tyler male 33 4512 agua negra shane42@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-20 stephanie murphy female 25 8503 chocori dduncan@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-20 troy johnson male 17 6625 cañada la rica lisa42@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-11-20 chelsea hatfield female 25 4740 agua salada alexismarshall@gmail.com +univ. 
nacional del comahue ciencias veterinarias 2020-11-21 frank miller male 29 5357 el horno ephillips@gmail.com +univ. nacional del comahue licenciatura en artes 2020-11-21 francis bell male 20 4135 caspinchango xbrooks@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-21 amanda hines female 32 7607 balneario atlantida bensonmichael@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-21 rebecca carter female 25 7635 el lenguaraz eric78@yahoo.com +univ. nacional del comahue actuario 2020-11-21 donna clark female 39 6505 dudignac sanchezrebecca@hotmail.com +univ. nacional del comahue medicina 2020-11-21 carrie davis female 17 4158 campo de talamayo zkhan@gmail.com +univ. nacional del comahue actuario 2020-11-21 amber edwards female 25 2315 estacion saguier dunnwilliam@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-21 dennis barnes male 23 1882 ezpeleta este youngaaron@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-11-21 carla long female 33 5340 agua grande danieldavidson@gmail.com +univ. nacional del comahue licenciatura en administración 2020-11-21 nicholas maynard male 33 3734 campo moreno ddavis@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-22 valerie sanders female 28 1667 manuel alberti jeffreysmith@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-22 debra price female 29 5609 aristides villanueva williamhorn@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-22 nicole garcia female 29 4632 antumpa danielle04@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-22 elizabeth ortiz female 39 4626 angosto del perchel vscott@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-22 karla anderson female 24 5575 andrade fcabrera@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-22 daniel roberts male 21 1651 san andres xmorris@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-22 cory kelly male 17 7507 el bombero russellamy@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-22 chris miller male 31 8340 aguada florencio caseysharon@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-22 michelle mora female 31 5507 baños lunlunta smithalan@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-11-22 matthew colon male 35 6213 lote 11 escuela 107 piercenicolas@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-23 alan scott male 27 3029 colonia adolfo alsina bowmandouglas@gmail.com +univ. nacional del comahue contador público 2020-11-23 jason scott male 25 5615 25 de mayo cherylgoodwin@yahoo.com +univ. nacional del comahue contador público 2020-11-23 michael nguyen male 29 6073 el triunfo bryan31@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-23 tammy smith female 31 6743 coliqueo ylee@hotmail.com +univ. nacional del comahue arquitectura 2020-11-23 christopher garcia male 40 1602 florida hollandalexander@hotmail.com +univ. nacional del comahue contador público 2020-11-23 jason james male 39 3574 capilla guadalupe norte nicholas57@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-11-23 donna chapman female 39 3224 la blanqueada scottherrera@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-23 david miller male 17 3048 angeloni ptran@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-11-24 amanda vaughn female 29 7261 saladillo norte christophercoleman@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-24 fernando munoz male 35 7136 adela macdonaldsarah@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-24 cameron may male 37 8126 aldea san andres ldean@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-24 april burns female 21 1748 general rodriguez rcarr@yahoo.com +univ. nacional del comahue agronomía 2020-11-24 mike peterson male 19 4612 carahunco john90@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-24 benjamin rice male 27 2443 colonia margarita ljenkins@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-24 john roberts male 31 2123 campo calvo hernandezalexander@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-24 rebekah gonzales female 31 7609 balneario la caleta mterry@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-24 jared dominguez male 25 6475 esteban de luca lopezkimberly@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-24 gerald moore male 28 1890 juan maria gutierrez jeffery98@gmail.com +univ. nacional del comahue arquitectura 2020-11-24 amy flores female 31 2848 berisso yrodriguez@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-11-25 ray cervantes male 37 2183 arequito jimmy39@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-25 keith neal male 17 3045 campo zavalla dvelez@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-25 shannon sandoval female 23 2440 barrio belgrano ortiz rothrebecca@gmail.com +univ. nacional del comahue diseño industrial 2020-11-25 james taylor male 23 1633 empalme torresmegan@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-11-25 edward miller male 39 5773 cañada ebailey@hotmail.com +univ. 
nacional del comahue ingeniería en informática 2020-11-25 shelly frazier female 19 2117 alcorta sylvia45@hotmail.com +univ. nacional del comahue farmacia 2020-11-25 david moore male 19 8162 garcia del rio melissalambert@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-11-25 latasha cook female 35 1665 jose clemente paz derek68@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-25 teresa montoya female 28 2183 arequito jasondrake@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-25 thomas becker male 23 5345 baños termales vsmith@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-25 david harris male 31 3485 carandaiti patriciacoleman@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-11-26 jesse steele male 25 2761 estancia santa catalina usanchez@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-11-26 heather smith female 23 3287 aldea san gregorio kathleenbennett@gmail.com +univ. nacional del comahue farmacia 2020-11-26 stephen goodman male 26 6321 caichue david38@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-26 kayla watkins female 18 5444 ampacama michaelduncan@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-26 matthew dixon male 19 3572 campo garabato howardalexandra@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-26 sandra miller female 25 8118 cabildo susan84@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-11-26 james suarez male 27 3057 estancia las gamas lrogers@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-11-26 nathan james male 35 9411 base aerea teniente matienzo nathanielporter@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-11-26 brett harper male 25 1661 bella vista lkidd@gmail.com +univ. 
nacional del comahue farmacia 2020-11-26 nicole smith female 33 5438 alto de sierra hollymedina@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-11-26 thomas richardson male 35 8133 la rosa lhughes@gmail.com +univ. nacional del comahue técnico para bioterios 2020-11-26 olivia molina female 24 5541 algarrobal abajo leewells@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-27 christopher daniels male 23 2311 adolfo alsina shannonpeterson@yahoo.com +univ. nacional del comahue medicina 2020-11-27 terri kim female 19 7407 libano emarshall@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-11-27 anthony george male 33 8536 chipauquil john53@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-27 rodney cooper male 27 5622 colonia jauregui tochoa@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-11-27 maureen clarke female 25 2630 firmat patrickgray@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-11-27 kenneth hill male 37 5363 anguinan christopherwright@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-27 kayla rodriguez female 21 2138 carcaraña nicholas59@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-11-27 daniel thomas male 31 1727 b los aromos san patricio sjohnson@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-27 timothy mitchell male 37 5549 agua de los manantiales ubarnes@hotmail.com +univ. nacional del comahue medicina 2020-11-27 stephanie stewart female 33 6305 atreuco arnoldcraig@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-27 elizabeth gates female 28 5421 la tranca timothyking@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-11-27 joseph knight male 25 6345 la bilbaina debraluna@gmail.com +univ. 
nacional del comahue técnico para bioterios 2020-11-27 megan hamilton female 37 5533 9 de julio sheltonlacey@gmail.com +univ. nacional del comahue arquitectura 2020-11-27 joshua carroll male 31 6461 capitan castro joann70@hotmail.com +univ. nacional del comahue arquitectura 2020-11-27 matthew norris male 25 3474 chavarria torressamantha@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-27 brian murray male 37 5359 alto jaguel barnesjeremy@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-27 sophia hart female 23 2187 arteaga louisgreer@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-28 brian ross male 37 9023 buen pasto aedwards@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-11-28 kelsey decker female 35 1659 campo de mayo awilliams@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-28 susan green female 37 9217 cholila donna60@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-28 felicia foley female 25 6550 bolivar hlloyd@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-28 jessica holmes female 29 3581 campo redondo iortiz@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-28 samantha garcia female 37 2144 campo horquesco hendrixraymond@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-11-28 karen conner female 33 5345 baños termales markwilson@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-28 dalton williams male 39 6105 cañada seca emily56@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-11-28 kevin ramirez male 17 8315 achico pbridges@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-28 hunter baker male 25 4149 alpachiri aliciareilly@hotmail.com +univ. 
nacional del comahue licenciatura en artes 2020-11-28 diana foster female 23 4111 aguada clynch@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-11-28 bruce walker male 33 3540 avanzada acostachelsea@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-11-28 amber aguilar female 17 4195 7 de abril gonzalezhannah@gmail.com +univ. nacional del comahue agronomía 2020-11-28 jennifer jones female 23 3052 cañadita gjohnson@gmail.com +univ. nacional del comahue diseño industrial 2020-11-29 ian williams male 29 2812 capilla del señor saragarcia@yahoo.com +univ. nacional del comahue diseño industrial 2020-11-29 paul sims male 29 6628 colonia zambungo brandidalton@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-11-29 crystal gray female 27 4618 abra de pives jeanetteleonard@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-29 brian edwards male 21 8508 ambrosio p lezica bernardbrian@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-11-29 denise guzman female 29 2713 manuel ocampo andrewssamuel@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-29 ana key female 21 6616 castilla ramossteven@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-29 william cortez male 21 8360 buena esperanza katherine29@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-29 gary miller male 31 5411 la legua usmith@gmail.com +univ. nacional del comahue actuario 2020-11-29 david dillon male 33 5276 baldes de pacheco bergerashley@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-29 jennifer hancock female 39 3338 17 de agosto jesus07@hotmail.com +univ. nacional del comahue bioquímica 2020-11-29 jordan hansen female 39 5636 favelli youngcynthia@yahoo.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-11-29 ronald lewis male 19 8113 baterias stephanie00@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-29 nancy clark female 31 7167 carilo matthew84@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-11-29 daniel cervantes male 17 1771 mercado central freemanerica@yahoo.com +univ. nacional del comahue licenciatura en administración 2020-11-30 michael price male 32 2743 arroyo dulce shernandez@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-11-30 michael whitaker male 35 8200 colonia lia y allende patrick36@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-11-30 peter richard male 35 4237 cortaderas freemanjonathan@hotmail.com +univ. nacional del comahue farmacia 2020-11-30 alexis smith female 21 3585 el sombrerito allentiffany@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-30 pamela myers female 24 6471 atahualpa powellalexander@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-11-30 nicholas freeman male 35 4626 angosto del perchel amandasexton@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-11-30 jeff rice male 29 5319 colpes jennifer21@hotmail.com +univ. nacional del comahue agronomía 2020-11-30 charles smith male 39 9301 el chalten richard35@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-11-30 maria jones female 37 3263 1 de mayo yatespaula@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-11-30 adam caldwell male 23 6660 25 de mayo mooredavid@hotmail.com +univ. nacional del comahue medicina 2020-11-30 gilbert smith male 37 2705 haras san jacinto eric84@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-11-30 keith richardson male 19 3540 avanzada mjohnson@yahoo.com +univ. 
nacional del comahue licenciatura en gestión de agroalimentos 2020-11-30 daniel park male 19 8200 colonia lia y allende gcole@hotmail.com +univ. nacional del comahue agronomía 2020-11-30 steven rodgers male 28 4137 abra baya erivera@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-11-30 julie carter female 33 9020 arroyo quilla mwilkerson@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-11-30 kimberly kent female 23 3176 estacion sola rodriguezkenneth@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-01 samuel reyes male 31 8313 arroyito timguerra@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-01 courtney johnson female 21 3013 colonia matilde vmitchell@hotmail.com +univ. nacional del comahue ingeniería electrónica 2020-12-01 thomas meyers male 35 5601 capitan montoya nicholasblankenship@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-01 terry white male 19 5722 acasape graydevin@hotmail.com +univ. nacional del comahue contador público 2020-12-01 michael hunter male 18 1718 san antonio de padua mark05@yahoo.com +univ. nacional del comahue arquitectura 2020-12-01 rhonda green female 21 4431 aguas calientes chaseantonio@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-01 timothy williams male 21 9003 bahia solano karen79@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-12-01 kathleen hawkins female 19 3003 colonia los zapallos campbellkevin@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-01 nathan brown male 21 1746 francisco alvarez danielle73@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-01 linda harris female 25 3048 angeloni hpatton@gmail.com +univ. 
nacional del comahue licenciatura en musicoterapia 2020-12-01 christian castillo male 23 3001 alto verde christinawest@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-01 amber perkins female 23 4612 carahunco nharris@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-12-01 kelly nicholson female 34 6214 casimiro gomez daniel55@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-02 mark wright male 38 5750 alto de la leña austin71@yahoo.com +univ. nacional del comahue actuario 2020-12-02 jason harper male 33 5460 agua de la zorra uwright@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-02 tanner abbott male 19 1744 cuartel v wcrawford@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-02 jared scott male 25 3358 cheroguita lpalmer@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-02 carl lopez male 19 6341 chapi talo alexyoung@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-12-02 autumn black female 23 6476 chiclana hjones@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-02 michelle campbell female 39 5592 el carbalino hward@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-02 jay ellis male 39 7305 antonio de los heros smithjessica@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-03 peggy adams female 35 7163 claverie deborahsmith@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-03 sandra burton female 19 4500 alto del saladillo kleinlauren@gmail.com +univ. nacional del comahue agronomía 2020-12-03 megan wright female 23 8363 colonia josefa linda63@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-03 richard foster male 28 7223 bonnement michaelbuchanan@yahoo.com +univ. 
nacional del comahue licenciatura en ciencia política 2020-12-03 emily ramirez female 33 2258 campo quiñones tayloramber@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-12-03 alexandra miller female 18 1864 alejandro korn johnsonshane@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-03 mark dudley male 39 6203 el olivo don55@yahoo.com +univ. nacional del comahue medicina 2020-12-03 deanna hill female 37 1739 general hornos vmoyer@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-12-03 christopher hall male 37 2752 almacen el descanso caleb43@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-04 krystal velasquez female 31 3555 campo huber ggutierrez@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-04 daniel clarke male 23 6239 gonzalez moreno vshepard@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-12-04 travis ward male 23 8212 abramo ocooper@hotmail.com +univ. nacional del comahue arquitectura 2020-12-04 stephen harrington male 31 6307 colonia la oracion francesmiles@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-04 olivia melton female 29 7160 la union twatkins@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-04 gerald west male 33 6000 barrio carosio lopezdestiny@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-04 carol white female 25 3532 curandu james89@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-04 steven watts male 33 9003 bahia solano ejenkins@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-04 marissa henderson female 38 7260 barrio villa saladillo gchambers@yahoo.com +univ. nacional del comahue actuario 2020-12-04 kathy evans female 39 5409 adan quiroga carriehernandez@yahoo.com +univ. 
nacional del comahue licenciatura en ciencias biológicas 2020-12-04 danielle herrera female 33 2512 campo charo johnwebb@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-04 alice moore female 33 3177 altamirano norte eshields@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-12-05 deborah nguyen female 23 4501 abra del trigo qscott@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-05 rebecca orozco female 17 1915 arbuco zfreeman@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-12-05 jonathan ashley male 19 4707 chañarcito steven16@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-12-05 michael hubbard male 25 3133 arroyo burgos taylorsolomon@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-12-05 cody kramer male 37 7601 barrio batan whitejeffery@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-05 nathan graham male 29 1804 canning collinscindy@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-05 holly lewis female 21 3188 colonia falco gordonjames@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-12-05 heather mills female 31 3351 azara rchavez@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-12-05 lori cook female 35 5722 acasape popejason@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-12-05 matthew carter male 35 6616 castilla ooconnor@gmail.com +univ. nacional del comahue arquitectura 2020-12-05 christopher harper male 37 1871 dock sud aarnold@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-12-05 ryan gonzalez male 27 4166 balderrama martinezmark@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-05 april velasquez female 25 5276 baldes de pacheco francissara@gmail.com +univ. 
nacional del comahue licenciatura en artes 2020-12-06 jason barnett male 33 9030 rio mayo robertgray@gmail.com +univ. nacional del comahue ciencias veterinarias 2020-12-06 tammy jimenez female 39 1804 canning harrischristina@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-12-06 nicholas morgan male 23 2301 bella italia robertsummers@gmail.com +univ. nacional del comahue diseño industrial 2020-12-06 steven mccall male 25 2848 berisso vgarrett@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-12-06 charles schmidt male 31 5401 barrio el tontal susanhurley@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-06 david santana male 37 6317 la florencia rebeccajohnson@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-06 jack kennedy male 19 3180 diego lopez alexandranolan@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-06 courtney cunningham female 17 5461 aguada de la peña jacqueline49@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-06 brian valencia male 26 5707 aguaditas collierbrian@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-06 john williams male 35 2324 colonia tacurales dawn87@gmail.com +univ. nacional del comahue contador público 2020-12-06 walter meyer male 38 5633 ochenta y cuatro jeremy45@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-06 heidi hernandez female 31 7011 aneque grande kathleenbaker@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-12-06 sergio pearson male 19 3197 abra guazu susan89@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-12-06 david frank male 33 4168 agua blanca anthony45@gmail.com +univ. 
nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-07 angela willis female 25 8512 igarzabal mnewton@gmail.com +univ. nacional del comahue licenciatura en sociología 2020-12-07 phillip richardson male 33 3216 arroyo hondo uholmes@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-07 olivia patterson female 31 1885 guillermo e hudson patricia85@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-07 nancy wall female 21 7113 la lucila del mar mcintoshlindsay@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-07 joann gibson female 33 1893 centro agricola el pato rebeccaallen@gmail.com +univ. nacional del comahue agronomía 2020-12-07 melissa hogan female 39 4601 corral de piedras jesus78@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-07 suzanne mcdaniel female 33 9303 cañadon del toro sarah44@yahoo.com +univ. nacional del comahue medicina 2020-12-07 michael ramos male 39 1865 el pampero eileen73@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-07 renee pena female 39 5770 chacras viejas perryjames@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-08 charles jones male 22 5733 cramer melissa41@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-12-08 monica wilson female 19 5757 san lorenzo clifford69@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-12-08 angela greer female 33 7633 maori edwinmarshall@gmail.com +univ. nacional del comahue farmacia 2020-12-08 nichole lopez female 39 7621 la sara kimberlylyons@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-12-08 melinda howard female 39 5449 aguango jessicabrooks@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-12-08 tiffany kim female 19 3474 chavarria wrightkristopher@yahoo.com +univ. 
nacional del comahue ingeniería en informática 2020-12-09 jeremy fernandez male 32 3260 arroyo molino pattondebra@yahoo.com +univ. nacional del comahue actuario 2020-12-09 brandy ruiz female 17 5435 algarrobo grande andrewmcbride@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-09 patricia lee female 29 5587 barcala nanderson@yahoo.com +univ. nacional del comahue medicina 2020-12-09 rebecca sweeney female 29 6433 arturo vatteone ehernandez@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-12-09 jane smith female 19 9203 aldea escolar arnoldzachary@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-09 ronald hicks male 31 5460 agua de la zorra jerrymartin@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-09 joel owen male 27 6409 jose maria blanco kevinsalas@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-12-09 arthur jenkins male 29 4182 campo la flor los ralos thompsonmark@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-09 tony green male 31 6601 altamira baxterkristina@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-10 brittany stewart female 29 9030 rio mayo hernandeznicole@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-10 colleen martin female 23 1770 aldo bonzi blakemaureen@yahoo.com +univ. nacional del comahue medicina 2020-12-10 joshua bailey male 19 7153 cangallo davidjones@gmail.com +univ. nacional del comahue diseño industrial 2020-12-10 matthew allison male 19 2252 colonia campo piaggio owilliams@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-12-10 melanie williams female 29 1885 guillermo e hudson matthew37@gmail.com +univ. nacional del comahue agronomía 2020-12-10 kathryn allen female 27 2185 campo crenna eatonbrooke@hotmail.com +univ. 
nacional del comahue bioquímica 2020-12-10 scott george male 33 2843 general galarza brittany55@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-10 kevin molina male 23 3470 arroyo grande rriggs@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-10 martha ferrell female 37 3592 colonia hardy bbeasley@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-10 hannah nichols female 19 1987 alegre qallen@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-12-10 allison smith female 31 5615 25 de mayo robert42@gmail.com +univ. nacional del comahue farmacia 2020-12-10 joseph watkins male 21 4145 ingenio la providencia nicolecalhoun@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-11 richard cooper male 19 3700 barrio gral jose de san martin tking@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-12-11 donna bishop female 35 1636 la lucila david59@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-11 jade armstrong female 39 8370 caminera qhenry@gmail.com +univ. nacional del comahue bioquímica 2020-12-11 ryan conway male 17 1980 barrio la dolly ralvarez@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-11 cassandra lee female 21 2905 general rojo phillipscarl@yahoo.com +univ. nacional del comahue farmacia 2020-12-11 timothy santiago male 19 6472 francisco madero sara03@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-11 morgan dennis female 31 2521 iturraspe johnsonleah@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-11 jessica salinas female 35 5369 pagancillo ijackson@gmail.com +univ. nacional del comahue técnico para bioterios 2020-12-11 rita taylor female 19 2843 general galarza karensmith@gmail.com +univ. 
nacional del comahue licenciatura en ciencias de la educación 2020-12-11 sarah tran female 33 8122 la viticola petermclaughlin@yahoo.com +univ. nacional del comahue medicina 2020-12-11 brett mejia male 23 8351 agrio balsa dcook@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-12-12 justin valenzuela male 33 5427 apeadero quiroga kelsey42@gmail.com +univ. nacional del comahue farmacia 2020-12-12 craig hawkins male 31 5331 andalucia klineandrew@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-12-12 jeffrey villanueva male 21 8162 garcia del rio james54@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-12 grant jackson male 31 2181 los molinos yjohnson@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-12 john santos male 37 1649 zona delta tigre rwarren@hotmail.com +univ. nacional del comahue arquitectura 2020-12-12 michael holmes male 39 9053 aguada grande mshaw@hotmail.com +univ. nacional del comahue medicina 2020-12-12 alan walter male 27 3480 algarrobal michael36@hotmail.com +univ. nacional del comahue bioquímica 2020-12-12 alexander bautista male 34 7600 barrio emir ramon juarez mcclaindanny@gmail.com +univ. nacional del comahue ingeniería en informática 2020-12-12 denise harper female 37 1871 dock sud ralph20@gmail.com +univ. nacional del comahue licenciatura en artes 2020-12-12 lawrence cannon male 39 3592 colonia hardy jessica37@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-12 mark trevino male 27 5329 amuschina eheath@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-12-12 maria larson female 30 8164 arquedas catherine31@gmail.com +univ. nacional del comahue farmacia 2020-12-12 robert myers male 17 3449 boliche lata jarvisjames@gmail.com +univ. nacional del comahue técnico para bioterios 2020-12-12 nicole garza female 17 2729 carreras lindapoole@gmail.com +univ. 
nacional del comahue licenciatura en artes 2020-12-12 leah baker female 37 2258 campo quiñones aprilparks@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-13 jillian hill female 39 9401 el zurdo douglasrice@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-12-13 timothy henry male 22 2154 capitan bermudez robertorobinson@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-13 michael ford male 23 8158 aparicio nashjustin@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-13 john mcbride male 27 9030 rio mayo imedina@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-13 joshua carr male 39 3283 colonia mabragaña webbdean@hotmail.com +univ. nacional del comahue medicina 2020-12-13 jordan gomez male 31 1897 manuel b gonnet david93@yahoo.com +univ. nacional del comahue contador público 2020-12-13 michael moore male 37 1713 barrio parque leloir tforbes@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-13 kevin rodriguez male 21 1865 el pampero melissadelgado@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-13 william bell male 25 2109 acebal erin70@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-13 courtney anderson female 29 1615 grand bourg dudleymichael@hotmail.com +univ. nacional del comahue bioquímica 2020-12-13 carol hudson female 20 7241 la porteña faguilar@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-12-13 denise kennedy female 35 6632 benitez ebishop@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-14 eric chase male 35 2449 avena lopezemily@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-14 jo shields female 31 1678 caseros hshields@yahoo.com +univ. 
nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-14 danielle wolfe female 20 7205 la esperanza rosas las flores carlsonphillip@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-14 jessica hardy female 20 2152 granadero baigorria glennkyle@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-12-14 johnny bowman male 19 1617 el talar hesssamantha@hotmail.com +univ. nacional del comahue farmacia 2020-12-14 catherine hubbard female 31 3700 barrio gral jose de san martin leslie55@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-12-14 angela lowe female 31 9105 angostura rhunt@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-12-14 victoria sanchez female 29 1623 barrio garin norte qclarke@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-14 carrie williams female 17 4622 bella vista asanchez@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-14 gilbert green male 22 5317 apoyaco mark28@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-12-14 rachel martinez female 34 5386 amana jonathan93@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-14 joe davis male 35 5553 empalme frontera susan59@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-12-14 sarah stanley female 29 6221 ceballos medinabilly@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-12-15 robert ayala male 37 6748 membrillar ashley71@yahoo.com +univ. nacional del comahue actuario 2020-12-15 joseph davis male 37 2349 colonia dos rosas y la legua wooddennis@yahoo.com +univ. nacional del comahue farmacia 2020-12-15 christopher hall male 35 3380 9 de julio kilometro 20 mathisjacob@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-15 tammy sanders female 21 3405 algarrobal puisoye feliciaromero@yahoo.com +univ. 
nacional del comahue licenciatura en ciencia política 2020-12-15 chelsea wong female 19 8183 avestruz marcus90@hotmail.com +univ. nacional del comahue medicina 2020-12-15 christopher white male 37 7151 langueyu xreilly@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-15 jonathan skinner male 29 6405 30 de agosto kathy67@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-12-15 michael woodard male 21 6505 dudignac kimberly82@yahoo.com +univ. nacional del comahue medicina 2020-12-15 larry hernandez male 23 6305 atreuco travismedina@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-12-15 john benton male 23 1669 del viso kimberly17@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-15 leslie gray female 35 5438 alto de sierra jacquelinemiller@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-16 morgan schroeder female 26 6387 caleufu fharper@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-16 michael davies male 29 5527 colonia santa teresa ellislaura@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-16 william burnett male 39 2752 almacen el descanso rebecca10@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-16 rebecca jordan female 27 7118 general guido jenniferpennington@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-17 peter salazar male 19 2609 colonia morgan kerry32@gmail.com +univ. nacional del comahue medicina 2020-12-17 shawn welch male 25 3199 los laureles tracie41@hotmail.com +univ. nacional del comahue contador público 2020-12-17 john garcia male 19 9301 el chalten frank69@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-17 nicole farmer female 20 5311 arauco ashley41@gmail.com +univ. 
nacional del comahue arquitectura 2020-12-17 sandra fitzgerald female 17 7607 balneario atlantida reesemegan@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-17 william gill male 35 5419 baños de la laja lewisjulie@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-17 denise scott female 17 5590 adrian maturano nelsonjennifer@yahoo.com +univ. nacional del comahue actuario 2020-12-17 jennifer campbell female 33 2454 cañada rosquin ann68@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-17 mary marshall female 33 2124 22 de mayo richardsonandres@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-17 nicole brennan female 33 3023 cululu westwilliam@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-17 jonathan gonzalez male 37 3234 bonpland stevearmstrong@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-18 david fernandez male 33 1642 san isidro austin97@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-18 timothy fisher male 39 3567 dest aeronautico milit reconqu vlawrence@gmail.com +univ. nacional del comahue farmacia 2020-12-18 desiree green female 29 6235 villa sauce marybray@gmail.com +univ. nacional del comahue licenciatura en administración 2020-12-18 rachel rivera female 19 6300 barrancas coloradas obrown@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-18 dorothy spears female 29 5361 aicuña kevincohen@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-18 danny davis male 32 7404 fortin lavalle collinhamilton@yahoo.com +univ. nacional del comahue ciencias veterinarias 2020-12-18 felicia stewart female 21 5751 agua salada hlove@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias de la educación 2020-12-18 reginald ross male 39 2854 dos hermanas kdawson@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-18 jennifer mcconnell female 36 2912 la querencia sanchezsean@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-12-18 mary reyes female 24 6360 barrio el molino brianaustin@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-12-18 sean keller male 21 4151 bajo de los sueldos utyler@yahoo.com +univ. nacional del comahue actuario 2020-12-18 michael anderson male 39 3530 aldea forestal ereed@yahoo.com +univ. nacional del comahue contador público 2020-12-18 steven rasmussen male 21 3583 isla tigre mario10@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2020-12-18 lisa osborne female 39 4655 cabreria guerrerobenjamin@hotmail.com +univ. nacional del comahue ingeniería en informática 2020-12-19 emily white female 37 4133 la banda ymyers@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-19 david mcgrath male 23 2183 arequito omorgan@gmail.com +univ. nacional del comahue licenciatura en administración 2020-12-19 mark erickson male 30 2173 campo pesoa snyderalicia@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-19 julie fernandez female 21 2751 almacen castro smithalicia@yahoo.com +univ. nacional del comahue arquitectura 2020-12-19 lauren baker female 38 1776 9 de abril nelsonscott@hotmail.com +univ. nacional del comahue actuario 2020-12-19 kathryn fox female 29 3181 arroyo moreira simpsoncharles@gmail.com +univ. nacional del comahue arquitectura 2020-12-19 rachel farrell female 33 8315 achico jonathon82@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-12-19 jeffrey henderson male 39 5300 amilgancho duranjames@yahoo.com +univ. 
nacional del comahue licenciatura en ciencias de la computación 2020-12-19 alexandra christian female 29 2204 jesus maria vlyons@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-19 jillian henderson female 38 3192 colonia bertozzi kathygraham@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-20 mary miller female 21 8363 colonia josefa bryantshannon@gmail.com +univ. nacional del comahue bioquímica 2020-12-20 larry jones male 38 9033 aldea apeleg miguel35@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-20 scott ross male 39 8375 cañadon de los indios brenda35@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-20 ricky villarreal male 19 6381 campo caretto zvaldez@gmail.com +univ. nacional del comahue agronomía 2020-12-20 jeff oneill male 37 3503 barranqueras julie39@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-20 ronald diaz male 17 1888 florencio varela heather84@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-12-20 justin klein male 33 9210 cuesta del ternero robertvega@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-20 richard ayala male 39 3364 2 de mayo gmartinez@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-20 kyle davenport male 27 5573 colonia delfino jguerrero@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-20 joseph wilson male 17 3261 centella vmoore@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-20 raymond moore male 22 2728 melincue deniseobrien@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-20 betty rivera female 38 6325 colonia devoto scottdavis@gmail.com +univ. 
nacional del comahue actuario 2020-12-20 brenda moore female 21 3465 arroyo casco davidsonjacob@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-20 robert hahn male 39 8361 isla grande edwardrodriguez@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-12-20 donald wright male 31 9305 cañada de las vacas angela77@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-20 julie robertson female 37 2407 campo clucellas cjones@yahoo.com +univ. nacional del comahue arquitectura 2020-12-20 kevin richardson male 39 9013 cañadon seco christinejohnson@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-21 taylor taylor female 35 6352 colonia la india jeremyjones@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-21 nancy flores female 21 1755 rafael castillo jacksoncantrell@gmail.com +univ. nacional del comahue arquitectura 2020-12-21 jessica morales female 19 5759 calera argentina rmay@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-21 heather rivera female 27 6237 america donald66@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-21 karen oconnor female 17 9051 aguada a pique gyoung@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-21 jose wilson male 33 2500 cañada de gomez ystewart@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-21 patricia robles female 32 6608 agote gdunn@hotmail.com +univ. nacional del comahue ciencias veterinarias 2020-12-21 eric donovan male 35 2313 colonia berlin jeanettealvarez@yahoo.com +univ. nacional del comahue medicina 2020-12-21 felicia miller female 23 3516 basail cjohnson@gmail.com +univ. nacional del comahue actuario 2020-12-21 denise payne female 33 6064 eduardo costa camachobrian@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-21 denise meyers female 27 1804 canning sheripayne@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-22 lindsay parker female 29 9213 cañadon caliente simonderek@hotmail.com +univ. nacional del comahue contador público 2020-12-22 samantha baker female 25 2918 empalme villa constitucion samanthadouglas@gmail.com +univ. nacional del comahue ingeniería en informática 2020-12-22 ashley hamilton female 22 1640 acassuso peckchris@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-22 vincent rodgers male 39 8156 el perdido est jose guisasola melissa16@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-22 james nelson male 28 7547 cascada jamesmartinez@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-12-22 steven henderson male 23 5429 el abanico tiffanymoody@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-12-22 alexander aguilar male 37 6559 recalde kellyangela@hotmail.com +univ. nacional del comahue licenciatura en psicología 2020-12-22 theodore avila male 33 3334 3 de mayo hartmegan@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-22 steven hawkins male 31 2826 aldea san antonio jaredarmstrong@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-12-22 tracy clark female 35 2601 la chispa stephaniewhite@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-22 scott bailey male 25 9101 alto de las plumas larry54@gmail.com +univ. nacional del comahue licenciatura en administración 2020-12-22 christopher bell male 33 1757 gregorio de laferrere egallegos@yahoo.com +univ. nacional del comahue contador público 2020-12-22 scott martin male 22 1647 zona delta san fernando frederick23@yahoo.com +univ. 
nacional del comahue técnico para bioterios 2020-12-23 krystal hill female 39 1828 banfield gregorygriffith@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2020-12-23 jessica collins female 19 3480 algarrobal howellkeith@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-23 katherine caldwell female 23 3446 kilometro 374 angela44@gmail.com +univ. nacional del comahue arquitectura 2020-12-23 lisa bonilla female 29 3342 aguapey jennifermiles@gmail.com +univ. nacional del comahue farmacia 2020-12-23 kristina rodriguez female 21 3016 san jose weststeven@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-12-23 bryan hall male 20 7172 colonia ferrari daniel68@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-23 sara griffin female 37 3267 cañada de las ovejas elainegalloway@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-23 jacqueline adams female 25 3300 arroyo jonathan33@gmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-23 kristen fletcher female 27 6341 chapi talo josephlowery@gmail.com +univ. nacional del comahue bioquímica 2020-12-23 amanda henry female 27 6471 atahualpa uwagner@gmail.com +univ. nacional del comahue agronomía 2020-12-23 heidi tyler female 33 3487 puesto de isla david21@gmail.com +univ. nacional del comahue farmacia 2020-12-23 sean zhang male 37 9015 alma grande erik60@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2020-12-23 jeffrey miller male 36 8208 campo cicare johnthompson@gmail.com +univ. nacional del comahue agronomía 2020-12-23 gary christensen male 29 5505 carbometal james83@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-24 jason franco male 39 5883 alto lindo hillsteven@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-24 rodney patterson male 17 7517 juan e barra courtneycisneros@gmail.com +univ. 
nacional del comahue medicina 2020-12-24 ashlee simmons female 19 3150 algarrobitos 1ro ysmith@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-24 jack freeman male 17 3032 nelson xhartman@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-12-24 michaela gibson female 25 3581 campo redondo aaronsanchez@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2020-12-24 samuel juarez male 23 5442 ambas puntillas bpatterson@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-24 john green male 33 7400 barrio la luisa alexanderkaren@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-12-24 linda baker female 39 6034 colonia alberdi wtaylor@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-12-24 holly mcdonald female 35 6345 la bilbaina brett37@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-24 jennifer evans female 24 6555 alfalad uschmidt@hotmail.com +univ. nacional del comahue actuario 2020-12-24 colleen perkins female 38 3025 colonia clara mitchellcarly@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-24 yesenia barrett female 17 6042 dos hermanos ksawyer@hotmail.com +univ. nacional del comahue agronomía 2020-12-24 arthur shaw male 25 5709 bañadito viejo johnwheeler@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-24 rebecca brown female 27 6472 francisco madero nicholasjones@gmail.com +univ. nacional del comahue licenciatura en artes 2020-12-25 ryan welch male 23 1915 arbuco bethcampbell@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-25 julie johnson female 23 4618 abra de pives james61@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-25 linda franco female 26 4113 acostilla aking@gmail.com +univ. 
nacional del comahue ingeniería en informática 2020-12-25 joshua turner male 17 2240 campo garcia christopher85@gmail.com +univ. nacional del comahue diseño industrial 2020-12-25 jason mullins male 24 2611 estacion christophersen courtney33@hotmail.com +univ. nacional del comahue medicina 2020-12-25 andrea ryan female 33 9120 bahia cracher kevindecker@gmail.com +univ. nacional del comahue licenciatura en artes 2020-12-25 shannon ortega male 27 5713 balde ahumada alicia56@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-25 kristen phelps female 39 6203 el olivo mingram@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-25 michael castillo male 35 2154 capitan bermudez sfox@gmail.com +univ. nacional del comahue medicina 2020-12-25 bradley miles male 37 6331 colonia beaufort floresrobert@yahoo.com +univ. nacional del comahue ingeniería mecánica 2020-12-25 janet bauer female 17 3581 campo redondo robert12@gmail.com +univ. nacional del comahue agronomía 2020-12-25 daniel armstrong male 17 1735 el durazno bjohnson@hotmail.com +univ. nacional del comahue licenciatura en administración 2020-12-25 nicole johnson female 33 8375 cañadon de los indios spencer19@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-25 carolyn fisher female 21 7221 francisco berra tammyaustin@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-12-25 jose vaughn male 26 3137 alcaraz sud andersoncheryl@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-25 meghan williams female 37 9311 cañadon leon burkedavid@hotmail.com +univ. nacional del comahue diseño industrial 2020-12-26 robert wang male 17 6632 benitez jennifer19@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-26 karen wilson female 29 3040 asuncion maria michele22@yahoo.com +univ. 
nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-26 carrie ferguson female 19 6300 barrancas coloradas martinball@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-26 robert west male 17 2607 campo quirno wheelerdouglas@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-26 heidi hughes female 40 2520 la california john91@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-26 deborah alvarez female 35 6369 campo salusso chapmanchristopher@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-12-26 jason rojas male 35 1648 rincon de milberg christinapatrick@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-26 april flynn female 29 3705 10 de mayo ffischer@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-26 janice robinson female 39 7301 ariel roachalexandra@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-26 kimberly hayes female 33 3056 campo coubert tracey11@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-27 lindsay johnson female 23 3050 calchaqui rjones@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2020-12-27 cody smith male 33 3705 10 de mayo kestrada@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-27 jessica dominguez female 35 7225 casalins michaeldiaz@hotmail.com +univ. nacional del comahue bioquímica 2020-12-27 mark alvarado male 31 5513 barrio jardin luzuriaga colleenrichardson@yahoo.com +univ. nacional del comahue técnico para bioterios 2020-12-27 catherine reynolds female 33 3466 abalo hannahvaughn@yahoo.com +univ. nacional del comahue ingeniería electrónica 2020-12-27 shelly taylor female 39 7623 campo la plata mckinneyjacob@gmail.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2020-12-27 jennifer boyd female 31 3185 colonia la marta gentryjennifer@yahoo.com +univ. nacional del comahue contador público 2020-12-27 willie lee male 19 8334 ingeniero huergo robinwilliams@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-12-27 ryan curtis male 29 5779 la chilca travisbaird@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2020-12-27 robert cox male 27 7408 la colina washingtonlisa@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2020-12-27 kristen perkins female 17 6475 esteban de luca yhernandez@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-28 robert gregory male 18 3254 colonia la blanquita rhodesjennifer@hotmail.com +univ. nacional del comahue farmacia 2020-12-28 angela pruitt female 39 7407 libano schambers@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-28 aaron roy male 21 3200 colonia los sauces lindsey61@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2020-12-28 sarah johnson female 25 5592 el carbalino clarkeallison@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-28 nathan johnson male 23 3722 2 de mayo peterwhite@hotmail.com +univ. nacional del comahue arquitectura 2020-12-28 william johnson male 21 3117 aldea san antonio smithcody@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2020-12-28 diana hines female 33 6326 anguil fsmith@yahoo.com +univ. nacional del comahue diseño industrial 2020-12-28 zachary stafford male 25 6348 bocayuba taylorshort@gmail.com +univ. nacional del comahue licenciatura en artes 2020-12-28 jason brown male 31 6042 dos hermanos crystalmccoy@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias de la educación 2020-12-28 christopher walker male 33 7169 juancho christinamendoza@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2020-12-28 jacqueline hamilton female 36 5615 25 de mayo thomas65@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2020-12-28 troy nelson male 37 8113 baterias collinsjennifer@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-28 kyle saunders male 25 9405 bahia tranquila gloriawilson@hotmail.com +univ. nacional del comahue licenciatura en sociología 2020-12-29 amber stevenson female 29 6032 blandengues jeffmorgan@hotmail.com +univ. nacional del comahue bioquímica 2020-12-29 jennifer lam female 35 2633 chovet perezjeremy@hotmail.com +univ. nacional del comahue ingeniería mecánica 2020-12-29 jason dean male 31 6403 badano austincarlson@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2020-12-29 madeline caldwell female 33 3020 campo santo domingo osbornejoy@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-29 joe rodriguez male 33 5738 avanzada isaiahwilcox@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-12-29 zachary reeves male 19 3332 capiovi townsenddawn@yahoo.com +univ. nacional del comahue licenciatura en sociología 2020-12-29 eddie watkins male 39 5605 calle larga vieja martinrandall@yahoo.com +univ. nacional del comahue ingeniería en informática 2020-12-29 dawn martinez female 21 8183 avestruz summersalexander@yahoo.com +univ. nacional del comahue licenciatura en artes 2020-12-30 jordan brooks male 27 8109 almirante solier kristinhowe@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-30 richard singh male 17 6621 anderson hkramer@gmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-30 karen castro female 33 6348 bocayuba erickrueger@hotmail.com +univ. 
nacional del comahue ingeniería electrónica 2020-12-30 wayne hayden male 17 3592 colonia hardy farmersusan@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2020-12-30 gregory blair male 31 3174 altamirano sud karencochran@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-31 jonathan shelton male 29 6463 alagon davidlawson@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2020-12-31 larry george male 29 4133 la banda davidrobinson@hotmail.com +univ. nacional del comahue licenciatura en artes 2020-12-31 debra jones female 23 5470 abra verde adamsrobert@gmail.com +univ. nacional del comahue licenciatura en psicología 2020-12-31 michele fields female 20 4111 aguada ecarey@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2020-12-31 kelly white female 20 1737 kilometro 77 jsalinas@hotmail.com +univ. nacional del comahue técnico para bioterios 2020-12-31 tina macdonald female 29 1838 luis guillon justin58@gmail.com +univ. nacional del comahue contador público 2020-12-31 cole ellis male 20 4147 alto las lechuzas laurengray@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2020-12-31 natasha arnold female 19 2170 candelaria sud christopherwade@yahoo.com +univ. nacional del comahue actuario 2020-12-31 shelley rodgers female 21 1678 caseros john99@gmail.com +univ. nacional del comahue medicina 2020-12-31 mark scott male 30 8127 estela kimberlydavis@yahoo.com +univ. nacional del comahue farmacia 2020-12-31 sarah lee female 37 5529 colonia bombal craigthomas@gmail.com +univ. nacional del comahue bioquímica 2020-12-31 julie browning female 35 1682 martin coronado weberrandy@yahoo.com +univ. nacional del comahue licenciatura en psicología 2020-12-31 lisa davis female 27 2121 perez iallen@gmail.com +univ. nacional del comahue ingeniería electrónica 2020-12-31 lisa downs female 21 6727 gouin monica97@gmail.com +univ. 
nacional del comahue ingeniería mecánica 2021-01-01 garrett navarro male 35 1631 villa rosa pdouglas@gmail.com +univ. nacional del comahue arquitectura 2021-01-01 courtney gay female 19 1858 villa numancia andreafrost@gmail.com +univ. nacional del comahue ciencias veterinarias 2021-01-01 wendy aguilar female 29 6533 alfredo demarchi holtemily@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-01 robert rogers male 37 4504 23 de agosto stewartcrystal@gmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-01 sarah key female 25 3416 arroyo ceibal smithmichelle@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-01 stephen mathis male 39 5557 caracoles christine82@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-01 lisa palmer female 25 3530 aldea forestal anthony05@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-01 nichole jackson female 33 3351 azara sbass@gmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-01 susan garcia female 28 7150 ayacucho gscott@hotmail.com +univ. nacional del comahue actuario 2021-01-01 melinda gutierrez female 17 1891 ingeniero allan halvarado@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-01 john glover male 21 6434 palantelen morriskevin@gmail.com +univ. nacional del comahue licenciatura en psicología 2021-01-02 jill garcia female 27 3450 8 de diciembre meganfarmer@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-02 wayne reynolds male 25 9007 el jaguel johncabrera@hotmail.com +univ. nacional del comahue ciencias veterinarias 2021-01-02 jason wall male 33 2242 arijon flove@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-02 laura johnson female 19 5873 isla jacob67@yahoo.com +univ. 
nacional del comahue licenciatura en producción de bioimagenes 2021-01-02 karen scott female 19 8333 aguada guzman taylorholmes@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-02 joy bryant female 35 9009 cañadon lagarto connor86@gmail.com +univ. nacional del comahue licenciatura en administración 2021-01-02 kevin hernandez male 19 3423 arañita richardscharles@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2021-01-02 douglas thomas male 29 5596 12 de octubre brandy35@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-02 tina smith female 23 8500 el dique hlopez@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-02 bobby lowe male 28 8111 arroyo pareja hayley34@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-02 natalie nelson female 27 1646 san fernando johnshaw@yahoo.com +univ. nacional del comahue licenciatura en sociología 2021-01-02 erika flores female 28 5465 baños pismanta adamswilliam@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-02 joann charles female 23 2852 alarcon ydavis@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-02 michelle harris female 27 3214 estacion yerua goodrobert@yahoo.com +univ. nacional del comahue ingeniería en informática 2021-01-03 albert moran male 25 3190 arroyo hondo ellen71@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-03 robert nielsen male 35 5615 25 de mayo cynthia17@yahoo.com +univ. nacional del comahue actuario 2021-01-03 parker hunter male 17 1619 garin michealdavis@hotmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-03 justin franklin male 28 4740 agua salada kkaufman@gmail.com +univ. 
nacional del comahue técnico para bioterios 2021-01-03 jennifer schroeder female 27 2722 wheelwright danielle61@yahoo.com +univ. nacional del comahue licenciatura en psicología 2021-01-03 scott coleman male 21 3158 20 de septiembre gutierrezscott@hotmail.com +univ. nacional del comahue medicina 2021-01-03 eric thompson male 22 1894 juan vucetich ex dr r levene lauren78@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-03 julie wilson female 40 3583 isla tigre michelle69@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-03 todd brown male 35 3287 aldea san gregorio martinjames@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-03 sarah roberts female 31 2218 carrizales wrightbrendan@hotmail.com +univ. nacional del comahue técnico para bioterios 2021-01-03 thomas silva male 22 1864 alejandro korn davidfoster@hotmail.com +univ. nacional del comahue farmacia 2021-01-03 shane taylor male 29 3509 campo el bermejo hendersonamber@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-03 anna phillips female 33 5637 30 de octubre vaughnjohn@yahoo.com +univ. nacional del comahue licenciatura en sociología 2021-01-03 walter marquez male 31 7263 el chumbeau michael27@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-03 misty carter female 19 5751 agua salada tasha15@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-03 raymond watson male 31 5461 aguada de la peña brittanychristian@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-04 joseph mason male 39 5622 colonia jauregui fmathis@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-04 sabrina robertson female 29 6348 bocayuba franklinmark@gmail.com +univ. 
nacional del comahue licenciatura en ciencias de la computación 2021-01-04 benjamin simmons male 39 6434 palantelen kelly15@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-04 william grimes male 29 4600 algarrobal nicolecallahan@gmail.com +univ. nacional del comahue farmacia 2021-01-04 ashley russell female 25 2352 ambrosetti anthony45@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-04 george wright male 29 8416 anecon grande megan83@yahoo.com +univ. nacional del comahue licenciatura en sociología 2021-01-04 amanda mcdaniel female 18 5319 colpes tammysharp@hotmail.com +univ. nacional del comahue medicina 2021-01-04 felicia coleman female 31 8146 el rincon hwilliams@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-05 judith mcfarland female 19 3545 kilometro 525 ngreen@hotmail.com +univ. nacional del comahue bioquímica 2021-01-05 norma owen female 29 5719 agua amarga xcampbell@yahoo.com +univ. nacional del comahue ciencias veterinarias 2021-01-05 theodore smith male 21 9001 cañadon ferrais duane94@hotmail.com +univ. nacional del comahue contador público 2021-01-05 tyler nguyen male 24 2501 berretta prubio@yahoo.com +univ. nacional del comahue licenciatura en psicología 2021-01-05 elizabeth alvarez female 27 8521 arroyo de la ventana irobles@hotmail.com +univ. nacional del comahue ingeniería en informática 2021-01-05 kyle hall male 39 9420 aserradero arroyo christina68@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-05 lindsey parsons female 37 5447 agua cercada acampbell@gmail.com +univ. nacional del comahue ingeniería en informática 2021-01-05 adam hines male 21 8370 caminera alvarezkristin@hotmail.com +univ. nacional del comahue medicina 2021-01-05 david ross male 17 3114 aldea maria luisa raustin@gmail.com +univ. 
nacional del comahue licenciatura en ciencias ambientales 2021-01-05 michele miller female 26 3041 cacique ariacaiquin tmolina@yahoo.com +univ. nacional del comahue ingeniería en informática 2021-01-05 tamara johnson female 29 2103 colonia escribano catherinedaniels@yahoo.com +univ. nacional del comahue medicina 2021-01-05 trevor nguyen male 35 9311 cañadon leon alexander06@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-05 marie bruce female 21 4643 antiguyos vfreeman@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-06 danielle mason female 25 3555 campo huber david48@yahoo.com +univ. nacional del comahue diseño industrial 2021-01-06 robert griffith male 17 3133 arroyo burgos christian64@yahoo.com +univ. nacional del comahue licenciatura en psicología 2021-01-06 elizabeth miller female 21 2181 los molinos monica02@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-06 brian norton male 39 6321 caichue kristen61@yahoo.com +univ. nacional del comahue contador público 2021-01-06 gavin taylor male 25 3003 colonia los zapallos edward24@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-06 howard lee male 33 8407 correntoso christian72@hotmail.com +univ. nacional del comahue actuario 2021-01-06 elizabeth scott female 29 2400 villani whitney13@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-06 robert thomas male 27 9015 alma grande woodardjeremy@hotmail.com +univ. nacional del comahue bioquímica 2021-01-06 gregory thompson male 19 3371 cabure mcdowellrobert@gmail.com +univ. nacional del comahue actuario 2021-01-06 renee smith female 17 6001 agustin roca scoleman@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-06 danielle thornton female 25 6439 bonifacio nking@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias antropológicas 2021-01-06 eric allen male 27 3513 arbol solo michellebenson@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-06 jessica daniel female 35 2723 estancia las gamas grantbrent@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-07 richard morgan male 37 8124 berraondo odonnellgrant@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-07 jill reed female 35 5535 asuncion stephaniegriffith@gmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-07 carmen estrada female 38 5609 aristides villanueva wsmith@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-07 alexandra richards female 35 5871 la aguada de las animas fscott@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-07 tyler smith male 25 1875 wilde rita46@yahoo.com +univ. nacional del comahue licenciatura en administración 2021-01-07 ryan anderson male 23 2840 albardon josephwhite@gmail.com +univ. nacional del comahue ingeniería en informática 2021-01-07 elaine howell female 27 2743 arroyo dulce eddieclark@gmail.com +univ. nacional del comahue ciencias veterinarias 2021-01-07 allison jones female 31 7212 doctor domingo harosteguy beth01@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-07 sara klein female 24 2728 melincue tanyaboone@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2021-01-07 kristen thomas female 40 8168 sierra de la ventana william36@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-07 ronald young male 25 1895 arturo segui chandlermark@gmail.com +univ. nacional del comahue ingeniería en informática 2021-01-07 brandon johnson male 31 3536 bocas newmanmelissa@hotmail.com +univ. 
nacional del comahue licenciatura en gestión de agroalimentos 2021-01-07 donna sims female 17 3076 huanqueros lindseysawyer@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-07 christopher ballard male 21 4147 alto las lechuzas valexander@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-08 karina pace female 35 7311 chillar ronald53@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-08 brett hansen male 21 5881 cañada la negra xcole@yahoo.com +univ. nacional del comahue licenciatura en artes 2021-01-08 jerry jones male 29 1812 carlos spegazzini irichardson@yahoo.com +univ. nacional del comahue ingeniería mecánica 2021-01-08 patrick smith male 29 3234 bonpland qnorman@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-08 lauren hunter female 19 1983 gomez sgross@yahoo.com +univ. nacional del comahue licenciatura en sociología 2021-01-08 christian dennis male 35 6469 asturias johnjones@yahoo.com +univ. nacional del comahue licenciatura en psicología 2021-01-08 deborah nolan female 39 4124 abra el candado jbaker@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-08 timothy harris male 37 6538 la dorita qpierce@gmail.com +univ. nacional del comahue técnico para bioterios 2021-01-08 anthony sweeney male 23 5722 acasape brookerice@hotmail.com +univ. nacional del comahue ingeniería en informática 2021-01-08 vincent anderson male 36 8309 centenario uandrade@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-08 taylor jensen female 17 3712 los frentones vanessawall@yahoo.com +univ. nacional del comahue arquitectura 2021-01-08 david cardenas male 17 3441 algarrobo irodriguez@yahoo.com +univ. nacional del comahue arquitectura 2021-01-08 daniel pitts male 33 6317 la florencia williamsjessica@yahoo.com +univ. 
nacional del comahue contador público 2021-01-09 brandi murray female 23 3407 aguay vdavis@gmail.com +univ. nacional del comahue licenciatura en psicología 2021-01-09 frank greene male 19 2637 colonia hansen taylorriley@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-09 michael peterson male 23 3382 colonia cunci myersjeff@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-09 timothy anderson male 39 5775 bajo grande odavies@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-09 john morrow male 21 3734 campo moreno wbailey@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-09 michael mcdonald male 25 3000 barranquitas benjamin45@yahoo.com +univ. nacional del comahue técnico para bioterios 2021-01-09 amy smith female 33 5750 alto de la leña robertdaniels@hotmail.com +univ. nacional del comahue licenciatura en administración 2021-01-09 jaime martinez female 39 8514 laguna del barro danielsweeney@yahoo.com +univ. nacional del comahue licenciatura en administración 2021-01-09 keith collins male 33 1921 alvarez jonte cmiller@yahoo.com +univ. nacional del comahue agronomía 2021-01-09 jose lee male 27 1882 ezpeleta este hyoung@hotmail.com +univ. nacional del comahue farmacia 2021-01-09 austin barnett male 21 4750 agua colorada xrogers@hotmail.com +univ. nacional del comahue licenciatura en sociología 2021-01-09 amy flores female 19 8200 colonia lia y allende pcabrera@hotmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-09 deanna neal female 17 8403 alicura taylorrichard@hotmail.com +univ. nacional del comahue bioquímica 2021-01-09 jessica evans female 30 1911 bme bavio gral mansilla tina86@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-09 suzanne pearson female 25 6330 arturo almaraz keith43@yahoo.com +univ. 
nacional del comahue licenciatura en producción de bioimagenes 2021-01-09 andrew mcpherson male 34 2814 alto los cardales turnerangela@gmail.com +univ. nacional del comahue licenciatura en psicología 2021-01-09 jay robinson male 19 2156 arsenal de guerra san lorenzo gchavez@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-09 kenneth hernandez male 35 1625 arroyo canelon pughrebecca@hotmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-09 katherine brown female 33 3378 22 de diciembre fernandezmaria@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2021-01-10 elizabeth avila female 33 5703 6 de septiembre williammccormick@hotmail.com +univ. nacional del comahue agronomía 2021-01-10 steven gross male 23 2318 aurelia amy54@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-10 peter rhodes male 19 3380 9 de julio kilometro 20 vcarey@yahoo.com +univ. nacional del comahue ingeniería mecánica 2021-01-10 cassandra acosta female 35 8332 colonia rusa wayne25@gmail.com +univ. nacional del comahue agronomía 2021-01-10 brad gonzalez male 39 4186 cañete leahwoods@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-10 carolyn byrd female 37 8403 alicura andreowens@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-10 elizabeth lam female 27 6400 barrio indio trompa austinthomas@hotmail.com +univ. nacional del comahue licenciatura en sociología 2021-01-10 travis bell male 21 6326 anguil daniel95@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-11 jerry stanley male 34 3572 campo garabato hernandezcynthia@hotmail.com +univ. nacional del comahue actuario 2021-01-11 lance hoffman male 21 7407 libano nortonmarc@hotmail.com +univ. nacional del comahue licenciatura en administración 2021-01-11 kevin king male 32 7509 oriente lvega@gmail.com +univ. 
nacional del comahue licenciatura en gestión de agroalimentos 2021-01-11 ashley gordon female 39 9121 aguada de las tejas toconnor@yahoo.com +univ. nacional del comahue farmacia 2021-01-11 douglas joseph male 19 5340 agua grande williamwilson@hotmail.com +univ. nacional del comahue arquitectura 2021-01-11 raymond ellis male 17 3061 antonio pini vincent52@hotmail.com +univ. nacional del comahue técnico para bioterios 2021-01-11 stephen sanchez male 27 3023 cululu lowerysarah@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-11 amy robinson female 26 6430 adolfo alsina nmartin@yahoo.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-11 tanya barrera female 27 7136 adela ugonzalez@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-11 jesus miller male 19 9220 cañadon la madera vangshawn@gmail.com +univ. nacional del comahue licenciatura en administración 2021-01-11 nicole watkins female 19 2438 frontera paul24@yahoo.com +univ. nacional del comahue ingeniería electrónica 2021-01-11 patrick perez male 27 3138 alcaraz 2do imoore@yahoo.com +univ. nacional del comahue licenciatura en artes 2021-01-11 william lewis male 33 2643 cafferata websterjames@gmail.com +univ. nacional del comahue agronomía 2021-01-11 ashley reeves female 31 5607 colonia bombal y tabanera shaffersandra@gmail.com +univ. nacional del comahue actuario 2021-01-12 luke dougherty male 23 5773 cañada williamtaylor@yahoo.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-12 jacob stout male 17 3555 campo huber ulutz@gmail.com +univ. nacional del comahue licenciatura en administración 2021-01-12 brenda robles female 39 6509 del valle marymckee@yahoo.com +univ. nacional del comahue farmacia 2021-01-12 jennifer woodard female 21 7247 barrientos daniel14@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-12 john miller male 35 7005 barker robertobowen@yahoo.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2021-01-12 jeffrey jacobson male 29 7105 san clemente del tuyu michael83@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-12 timothy lewis male 23 5475 agua de la piedra sandersdeborah@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-12 jessica schmitt female 17 5595 cupiles mstanley@gmail.com +univ. nacional del comahue medicina 2021-01-12 david hodge male 37 3412 albardon margaretfigueroa@hotmail.com +univ. nacional del comahue medicina 2021-01-12 thomas franklin male 32 2443 colonia margarita sandovallawrence@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-12 krista clayton female 37 6625 cañada la rica maurice27@hotmail.com +univ. nacional del comahue diseño industrial 2021-01-12 laura rivas female 37 7305 antonio de los heros bettyrodriguez@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-12 randy hawkins male 26 9000 comodoro rivadavia privas@gmail.com +univ. nacional del comahue arquitectura 2021-01-12 charles cook male 25 1670 nordelta leroy48@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-12 richard rodgers male 39 8504 cantera villalonga blake44@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-12 beverly gonzalez female 35 6105 cañada seca muellerjoseph@gmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-12 melanie mason female 39 9421 frigorifico cap taylorbrittany@yahoo.com +univ. nacional del comahue arquitectura 2021-01-13 katherine jackson female 31 7226 gorchs javier55@yahoo.com +univ. nacional del comahue arquitectura 2021-01-13 terri olson female 19 3190 arroyo hondo nathan96@gmail.com +univ. 
nacional del comahue ingeniería mecánica 2021-01-13 courtney martinez female 31 1650 general san martin sandy97@hotmail.com +univ. nacional del comahue arquitectura 2021-01-13 richard hatfield male 31 3487 puesto de isla brianpowell@gmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-13 shelley swanson female 31 6503 desvio kilometro 234 gregory87@gmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-13 virginia mitchell female 33 5741 13 de enero allison88@hotmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-13 matthew bennett male 35 2301 bella italia fmoran@yahoo.com +univ. nacional del comahue actuario 2021-01-13 stephen moore male 21 5276 baldes de pacheco randy37@yahoo.com +univ. nacional del comahue actuario 2021-01-13 brandon smith male 31 7003 aceilan samantha03@gmail.com +univ. nacional del comahue ciencias veterinarias 2021-01-14 christine flowers female 19 5275 agua colorada michael56@yahoo.com +univ. nacional del comahue contador público 2021-01-14 melissa adams female 34 5717 el pimpollo preyes@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-14 joshua knight male 19 7001 la pastora gabrielgallagher@hotmail.com +univ. nacional del comahue diseño industrial 2021-01-14 danielle peterson female 31 2814 alto los cardales kjohnson@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-14 blake campbell male 23 2128 arroyo seco herringconnie@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-14 nicholas hunter male 25 5721 agua seballe taylordavid@hotmail.com +univ. nacional del comahue licenciatura en psicología 2021-01-14 michael villa male 33 9101 alto de las plumas pauldenise@gmail.com +univ. nacional del comahue licenciatura en psicología 2021-01-14 logan decker male 25 2747 coronel isleños johnsongloria@yahoo.com +univ. 
nacional del comahue licenciatura en producción de bioimagenes 2021-01-14 sarah martin female 21 4230 brea chimpana kenneth21@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-14 kevin robles male 39 4147 alto las lechuzas daniel72@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-14 erica ware female 21 5724 alto pencoso kevin51@yahoo.com +univ. nacional del comahue ingeniería electrónica 2021-01-14 james hoffman male 31 9310 aguada alegre jamiejohnson@hotmail.com +univ. nacional del comahue actuario 2021-01-14 heather combs female 29 2240 campo garcia kelliott@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-15 michael montoya male 23 2701 12 de agosto lmartinez@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-15 mario johnson male 27 9111 bahia bustamante tsolis@gmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-15 suzanne williams female 23 8175 goyena brenda30@yahoo.com +univ. nacional del comahue farmacia 2021-01-15 alexander mccoy male 29 5515 maipu wendy07@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-15 christina hogan female 17 5365 el jumeal jordangary@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-15 jacqueline wilson female 33 7160 la union jesparza@yahoo.com +univ. nacional del comahue licenciatura en sociología 2021-01-15 sarah dickerson female 35 3580 kilometro 408 andersonnicholas@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-15 christopher brown male 35 5733 cramer wmartinez@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-15 melissa solis female 23 8111 arroyo pareja diamondclark@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-15 rachel parker female 27 8160 fortin chaco michael14@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia política 2021-01-15 joseph harris male 17 7519 san mayol brittney42@yahoo.com +univ. nacional del comahue arquitectura 2021-01-15 roy thomas male 23 2808 atucha lewisrobin@yahoo.com +univ. nacional del comahue diseño industrial 2021-01-15 michael williams male 27 1640 acassuso jameslewis@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-15 john obrien male 37 5417 9 de julio brandon10@hotmail.com +univ. nacional del comahue licenciatura en administración 2021-01-15 megan moss female 25 2508 armstrong michellethompson@gmail.com +univ. nacional del comahue licenciatura en administración 2021-01-15 sandra rodriguez female 17 7503 cristiano muerto benjamin95@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-15 kenneth adams male 19 1761 20 de junio douglas67@hotmail.com +univ. nacional del comahue diseño industrial 2021-01-15 kathy jones female 21 3003 colonia los zapallos bscott@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-16 benjamin reese male 17 1889 bosques wrightralph@gmail.com +univ. nacional del comahue licenciatura en artes 2021-01-16 jacob garner male 18 6207 alta italia warnermichael@yahoo.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-16 david thomas male 30 3132 el pingo rosefrederick@gmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-16 ana evans female 27 7226 gorchs barbarafarrell@gmail.com +univ. nacional del comahue licenciatura en artes 2021-01-16 christopher park male 21 9203 aldea escolar wilsondebra@gmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-16 eric barr male 29 1744 cuartel v pattersonjonathan@gmail.com +univ. nacional del comahue agronomía 2021-01-16 anna morales female 21 4651 agua de castilla woodjulie@yahoo.com +univ. 
nacional del comahue licenciatura en ciencias biológicas 2021-01-16 nathan anderson male 27 6075 arenaza parkerwilliam@gmail.com +univ. nacional del comahue diseño industrial 2021-01-16 john yu male 25 3380 9 de julio kilometro 20 aaron55@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-16 heather santos female 23 1684 ciudad jardin del palomar wilsonjulie@yahoo.com +univ. nacional del comahue ingeniería mecánica 2021-01-16 tina carroll female 19 2301 bella italia dawn50@hotmail.com +univ. nacional del comahue medicina 2021-01-16 anthony dean male 21 3009 el tropezon aaronsmith@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-16 samuel rivera male 35 2311 adolfo alsina hyoder@gmail.com +univ. nacional del comahue licenciatura en administración 2021-01-17 charles hughes male 30 2806 las palmas loganronald@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-17 justin bass male 21 3543 colonia lote 12 gvelez@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-17 joanna montoya female 29 3712 los frentones tammyclark@hotmail.com +univ. nacional del comahue ingeniería en informática 2021-01-17 randy rojas male 33 4164 bajastine cwebb@hotmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-17 lori randall female 17 6455 carlos tejedor tami95@yahoo.com +univ. nacional del comahue agronomía 2021-01-17 roberto joseph male 37 6036 diego de alvear treed@gmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-17 sherry jones female 25 2605 otto bemberg carriesims@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-17 michael fisher male 30 3000 barranquitas mclaughlincheryl@yahoo.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-17 brian myers male 29 6734 rawson knightmatthew@yahoo.com +univ. 
nacional del comahue licenciatura en ciencias de la computación 2021-01-17 john brown male 23 4504 23 de agosto smithamanda@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-17 joseph briggs male 24 8415 arroyo las minas hernandezbrian@gmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-17 elizabeth leblanc female 31 9407 28 de noviembre shelley61@gmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-18 amber brown female 23 3206 bella union paraje rachelmcdonald@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-18 kristin perkins female 21 3355 arrechea samuel60@gmail.com +univ. nacional del comahue actuario 2021-01-18 dawn hughes female 17 1613 los polvorines sharon90@hotmail.com +univ. nacional del comahue licenciatura en ciencias geológicas 2021-01-18 ann jordan female 39 5609 aristides villanueva richard96@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-18 nicholas fisher male 21 5260 acheral harrisrobert@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-18 joshua jones male 27 3346 bacacay hendersonchristopher@yahoo.com +univ. nacional del comahue ingeniería en informática 2021-01-18 justin alvarado male 29 1816 colonia santa rosa harrymason@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-18 grace reynolds female 17 3081 cavour christopher92@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-18 kristie drake female 37 7630 hospital necochea williamssamantha@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-19 aaron kim male 39 6721 azcuenaga christopherwood@yahoo.com +univ. nacional del comahue medicina 2021-01-19 nicole castaneda female 21 4109 alto nuestra señora del valle nicole64@hotmail.com +univ. 
nacional del comahue licenciatura en ciencias geológicas 2021-01-19 rickey williams male 21 2202 cerana seth53@gmail.com +univ. nacional del comahue técnico para bioterios 2021-01-19 cristina humphrey female 25 1804 canning anneconway@gmail.com +univ. nacional del comahue agronomía 2021-01-19 meagan harmon female 27 9101 alto de las plumas wendyfigueroa@hotmail.com +univ. nacional del comahue técnico para bioterios 2021-01-19 louis bennett male 37 2717 acevedo karen93@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-19 jill sanford female 29 2449 avena wcox@gmail.com +univ. nacional del comahue medicina 2021-01-19 joshua brown male 23 2309 colonia reina margarita kmccullough@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-19 ryan maldonado male 27 1746 francisco alvarez gavinharris@gmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-19 andrea randolph female 21 5755 alto del molle santosheidi@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-19 david rowe male 31 7167 carilo luis40@gmail.com +univ. nacional del comahue licenciatura en sociología 2021-01-19 ryan clay male 33 2255 campo rodriguez michael23@gmail.com +univ. nacional del comahue contador público 2021-01-19 jon key male 39 2309 colonia reina margarita gcooper@yahoo.com +univ. nacional del comahue ingeniería mecánica 2021-01-19 john wright male 29 1614 villa de mayo kimberlystone@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-19 peter williams male 31 6723 cucullu ashley12@hotmail.com +univ. nacional del comahue actuario 2021-01-19 rebekah rios female 37 8309 centenario timothyeverett@gmail.com +univ. nacional del comahue bioquímica 2021-01-19 christine reynolds female 19 9121 aguada de las tejas aprilclark@gmail.com +univ. 
nacional del comahue licenciatura en artes 2021-01-20 robert guerrero male 37 7406 aldecon zporter@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2021-01-20 katelyn wright female 21 3563 colonia san manuel glewis@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-20 melanie oconnor female 39 3190 arroyo hondo justinbell@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-20 george cuevas male 35 3254 colonia la blanquita wendyknight@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-20 mary alvarez female 33 9035 arroyo chalia iwright@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-20 sheri schroeder female 25 5701 11 de mayo burnsnicole@gmail.com +univ. nacional del comahue diseño industrial 2021-01-21 jerome manning male 39 7612 camet brownbrian@yahoo.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-21 tina thomas female 33 1670 nordelta jessica34@yahoo.com +univ. nacional del comahue licenciatura en administración 2021-01-21 michael palmer male 33 6101 villa saboya theresahernandez@gmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-21 erica pace female 29 3016 san jose alison24@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-21 kevin alexander male 35 2919 copacabana jaredgrimes@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-21 ashley hughes female 19 3363 25 de mayo ibyrd@yahoo.com +univ. nacional del comahue ciencias veterinarias 2021-01-21 jonathan ortega male 21 2248 bernardo de irigoyen david52@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-21 julie crane female 37 3232 cabred wgibbs@gmail.com +univ. 
nacional del comahue diseño industrial 2021-01-21 jonathan thomas male 31 5407 dique toma amyandrews@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-21 christina mcclure female 23 8103 garro bradfordkathleen@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-21 karen hurst female 23 7020 benito juarez rodney75@gmail.com +univ. nacional del comahue farmacia 2021-01-21 ricky lee male 37 8417 cañadon chileno stodd@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-22 sharon davidson female 17 8508 ambrosio p lezica elijahhawkins@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-22 logan stone male 27 6705 villa ruiz stevengordon@hotmail.com +univ. nacional del comahue licenciatura en psicología 2021-01-22 jorge moore male 34 5547 villa hipodromo ryan99@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-22 todd ochoa male 29 6551 juan f ibarra lmcmahon@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-22 michael robinson male 25 7613 calfucura mfrancis@yahoo.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-22 ryan jenkins male 23 6721 azcuenaga michael90@hotmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-22 elizabeth martinez female 37 2146 clason hollowayricky@yahoo.com +univ. nacional del comahue técnico para bioterios 2021-01-23 molly farmer female 19 2720 colon aramirez@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-01-23 kenneth flowers male 31 2754 campo crisol harristyler@gmail.com +univ. nacional del comahue bioquímica 2021-01-23 david greene male 17 2845 colonia duportal dalton68@yahoo.com +univ. nacional del comahue actuario 2021-01-23 charles wiley male 35 3440 barrio villa cordoba ashleysanchez@gmail.com +univ. 
nacional del comahue licenciatura en ciencias biológicas 2021-01-23 kevin hamilton male 37 4514 calilegua jacqueline98@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-23 amy little female 21 5541 algarrobal abajo christy85@hotmail.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-23 mark arnold male 23 5773 cañada campbellsamantha@hotmail.com +univ. nacional del comahue arquitectura 2021-01-23 lauren wood female 19 3014 angel gallardo brandi48@gmail.com +univ. nacional del comahue agronomía 2021-01-23 roberta williams female 21 6387 caleufu michellewillis@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-23 dawn jefferson female 21 3551 campo monte la viruela juan36@yahoo.com +univ. nacional del comahue licenciatura en psicología 2021-01-23 kimberly price female 37 9303 cañadon del toro davidcooke@hotmail.com +univ. nacional del comahue licenciatura en administración 2021-01-23 barbara vaughn female 40 6017 chancay williamsonkayla@yahoo.com +univ. nacional del comahue medicina 2021-01-24 cynthia snyder female 34 2175 barlett webersabrina@yahoo.com +univ. nacional del comahue bioquímica 2021-01-24 daniel ortega male 37 6315 colonia baron frank71@hotmail.com +univ. nacional del comahue licenciatura en sociología 2021-01-24 joshua carter male 19 5711 angelita hgreer@yahoo.com +univ. nacional del comahue técnico para bioterios 2021-01-24 frank warren male 39 7106 las toninas ajohnson@gmail.com +univ. nacional del comahue ciencias veterinarias 2021-01-25 richard macias male 27 7307 crotto ykim@yahoo.com +univ. nacional del comahue diseño industrial 2021-01-25 brad hernandez male 33 5345 baños termales alyssa88@yahoo.com +univ. nacional del comahue diseño industrial 2021-01-25 kristine edwards female 37 4231 albigasta mduran@yahoo.com +univ. 
nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-25 brandi hall female 35 4504 23 de agosto pughtimothy@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-25 tonya steele female 33 1646 san fernando latoya42@yahoo.com +univ. nacional del comahue licenciatura en kinesiología y fisiatría 2021-01-25 wendy parker female 35 1614 villa de mayo isanchez@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-25 regina griffin female 17 2607 campo quirno derekbarber@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-25 james peterson male 23 3522 el retiro umckee@hotmail.com +univ. nacional del comahue bioquímica 2021-01-25 deanna evans female 39 3156 betbeder christopher84@yahoo.com +univ. nacional del comahue licenciatura en artes 2021-01-25 allison hernandez female 19 8412 cañadon del corral daltonwilliam@hotmail.com +univ. nacional del comahue agronomía 2021-01-25 keith brown male 33 5773 cañada samanthagordon@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-25 richard booth male 33 2183 arequito mortonstacy@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-26 stephanie mcknight female 23 7505 balneario claromeco xflores@gmail.com +univ. nacional del comahue licenciatura en artes 2021-01-26 cynthia carter female 37 1631 villa rosa jessica97@yahoo.com +univ. nacional del comahue diseño industrial 2021-01-26 candace jones female 23 9305 cañada de las vacas hardinkeith@yahoo.com +univ. nacional del comahue licenciatura en artes 2021-01-26 christopher jackson male 29 5735 colonia bella vista calderonbrittany@gmail.com +univ. nacional del comahue diseño industrial 2021-01-26 diana hall female 39 3125 antonio tomas richard95@yahoo.com +univ. nacional del comahue ingeniería en informática 2021-01-26 tyler irwin male 25 8316 balsa senillosa dunntracy@hotmail.com +univ. 
nacional del comahue licenciatura en ciencia política 2021-01-26 benjamin foster male 38 4622 bella vista brandimccullough@hotmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-26 christopher watts male 32 9050 gobernador moyano gsnyder@yahoo.com +univ. nacional del comahue bioquímica 2021-01-26 heidi warren female 23 1655 jose leon suarez mweaver@yahoo.com +univ. nacional del comahue bioquímica 2021-01-26 jamie martin female 37 2216 campo raffo anne53@hotmail.com +univ. nacional del comahue licenciatura en ciencias antropológicas 2021-01-26 todd gordon male 29 3381 maria magdalena muellerdonna@gmail.com +univ. nacional del comahue actuario 2021-01-26 devin williams male 25 1832 lomas de zamora joseph95@gmail.com +univ. nacional del comahue bioquímica 2021-01-26 william contreras male 25 2201 ricardone nicolejones@hotmail.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-27 timothy hernandez male 35 5321 el potrero juliekim@gmail.com +univ. nacional del comahue licenciatura en artes 2021-01-27 jessica curry female 20 1907 el pino jeffrey86@gmail.com +univ. nacional del comahue diseño industrial 2021-01-27 nicholas henson male 23 2843 general galarza jameskevin@gmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-27 matthew bridges male 17 1984 domselaar taylorperez@hotmail.com +univ. nacional del comahue agronomía 2021-01-27 courtney bryan female 31 1856 glew howardzachary@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-27 brandon perez male 36 2805 arroyo aleli michellesanchez@yahoo.com +univ. nacional del comahue bioquímica 2021-01-27 herbert jackson male 37 5311 arauco solismichael@hotmail.com +univ. nacional del comahue ingeniería en informática 2021-01-27 gina hoffman female 35 2503 villa eloisa michael52@hotmail.com +univ. 
nacional del comahue agronomía 2021-01-27 troy harris male 37 3011 campo magnin beverlycox@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-27 michael morales male 18 2763 flamenco mcfarlandjohnny@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-27 christopher salazar male 17 6505 dudignac connor46@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la educación 2021-01-28 brandon lang male 17 9220 cañadon la madera josephboyd@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-28 patrick christensen male 33 2622 maggiolo jacqueline29@gmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-28 geoffrey taylor male 27 5560 arroyo claro margaret95@gmail.com +univ. nacional del comahue actuario 2021-01-28 roy michael male 17 5557 caracoles gregory43@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-28 nicole black female 29 1768 ciudad madero choicarrie@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-28 lisa espinoza female 31 9220 cañadon la madera steven98@gmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-28 amber hawkins female 33 3449 boliche lata ryan00@gmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-28 alicia haley female 22 3023 cululu shafferjoseph@gmail.com +univ. nacional del comahue ciencias veterinarias 2021-01-28 justin mcdonald male 25 6513 colonia las yescas zthomas@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-28 monique cervantes female 19 5421 la tranca sarah24@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-28 whitney carr female 17 5501 cerrillos al sud christina10@yahoo.com +univ. 
nacional del comahue licenciatura en producción de bioimagenes 2021-01-28 robert smith male 23 1885 guillermo e hudson markrussell@hotmail.com +univ. nacional del comahue licenciatura en terapia ocupacional 2021-01-28 brian richards male 35 1735 el durazno brownelizabeth@hotmail.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-29 ashley frost female 25 8521 arroyo de la ventana hrasmussen@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-29 jill terry female 25 2747 coronel isleños jeffreygarner@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-29 debra johnson female 29 6078 bayauca langjeremy@yahoo.com +univ. nacional del comahue licenciatura en relaciones del trabajo 2021-01-29 stephanie logan female 35 7605 barrio chapadmalal yfisher@hotmail.com +univ. nacional del comahue diseño industrial 2021-01-29 melissa daniels female 29 4518 aguas calientes riveraeric@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-29 casey ward male 37 2177 bigand ryan94@yahoo.com +univ. nacional del comahue licenciatura en psicología 2021-01-29 jennifer davis female 21 6453 carlos salas lhernandez@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-29 lindsey kim female 25 7114 canal 15 cerro de la gloria davidbush@hotmail.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-29 darren holmes male 21 3076 huanqueros jhall@yahoo.com +univ. nacional del comahue contador público 2021-01-29 felicia smith female 35 2707 4 de noviembre robinsoncaitlin@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-29 rachel malone female 25 9040 cañadon botello james64@gmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-29 lisa perry female 33 3117 aldea san antonio basssarah@yahoo.com +univ. 
nacional del comahue actuario 2021-01-29 timothy brown male 19 5743 la isabel jonathanmiller@hotmail.com +univ. nacional del comahue diseño industrial 2021-01-29 debra johnson female 17 3443 colonia mendez bar loveian@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-29 carrie johnson female 33 6305 atreuco nmclean@hotmail.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-30 sarah johnston female 23 1607 villa adelina ubush@gmail.com +univ. nacional del comahue licenciatura en ciencia y tecnología de alimentos 2021-01-30 kelly simpson female 31 5624 kilometro 47 ycoffey@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-30 linda nash female 29 5275 agua colorada ortegadave@hotmail.com +univ. nacional del comahue ingeniería mecánica 2021-01-30 jonathan taylor male 17 2943 ireneo portela alanbennett@yahoo.com +univ. nacional del comahue licenciatura en ciencias de la computación 2021-01-30 isaac suarez male 17 4109 alto nuestra señora del valle alawrence@yahoo.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-30 allen phelps male 39 3188 colonia falco yharris@hotmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-30 gregory wright male 33 6475 esteban de luca sarahsloan@yahoo.com +univ. nacional del comahue licenciatura en ciencias ambientales 2021-01-30 jeffrey ward male 35 6665 ernestina jasmine13@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-30 emily alexander female 33 4187 anta chica zparrish@hotmail.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-30 richard rice male 40 1980 barrio la dolly moralesthomas@hotmail.com +univ. nacional del comahue licenciatura en musicoterapia 2021-01-30 john simpson male 39 3342 aguapey jenna23@yahoo.com +univ. 
nacional del comahue licenciatura en terapia ocupacional 2021-01-30 cory church male 17 3334 3 de mayo ashleywilliams@gmail.com +univ. nacional del comahue bioquímica 2021-01-30 shawn hahn male 29 8115 bajo hondo christy55@gmail.com +univ. nacional del comahue ingeniería electrónica 2021-01-30 richard harrison male 37 3071 aguara grande pierceheather@gmail.com +univ. nacional del comahue licenciatura en administración 2021-01-30 russell davis male 37 6405 30 de agosto dchan@gmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-30 lawrence wheeler male 31 5272 comandante leal paulthomas@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-30 william price male 27 2732 4 de febrero swansonjoseph@gmail.com +univ. nacional del comahue diseño industrial 2021-01-30 katrina cooke female 27 3376 gobernador lanusse michelesmith@gmail.com +univ. nacional del comahue diseño industrial 2021-01-30 kristen lucero female 35 1923 arroyo del pescado whitematthew@hotmail.com +univ. nacional del comahue medicina 2021-01-30 teresa cooper female 35 3328 colonia japonesa xmann@gmail.com +univ. nacional del comahue licenciatura en planificación y diseño del paisaje 2021-01-31 angela copeland female 38 6513 colonia las yescas edaniels@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-31 christopher estrada male 29 2812 capilla del señor williamporter@hotmail.com +univ. nacional del comahue medicina 2021-01-31 megan glover female 19 8129 17 de agosto jonesdeborah@hotmail.com +univ. nacional del comahue ingeniería en informática 2021-01-31 anna richmond female 37 4753 corralito fthompson@yahoo.com +univ. nacional del comahue licenciatura en gestión de agroalimentos 2021-01-31 william taylor male 29 2449 avena holly49@gmail.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-31 theresa gonzales female 29 8208 campo cicare palmerlori@gmail.com +univ. 
nacional del comahue diseño de imagen y sonido 2021-01-31 ashley osborne female 31 2715 el socorro rcoffey@hotmail.com +univ. nacional del comahue licenciatura en ciencia política 2021-01-31 alan crane male 31 2216 campo raffo brandi05@yahoo.com +univ. nacional del comahue licenciatura en sociología 2021-01-31 troy mason male 27 6345 la bilbaina margaret95@yahoo.com +univ. nacional del comahue licenciatura en producción de bioimagenes 2021-01-31 lisa hanna female 17 2615 la gama mcdonaldjoshua@hotmail.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-01-31 lance williams male 40 7247 barrientos jennifer42@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-01-31 abigail mays female 31 9225 arenoso maria16@yahoo.com +univ. nacional del comahue agronomía 2021-01-31 ryan davis male 37 3328 colonia japonesa patriciazamora@gmail.com +univ. nacional del comahue diseño de imagen y sonido 2021-02-01 james hodge male 27 8160 fortin chaco norrisstephen@gmail.com +univ. nacional del comahue diseño industrial 2021-02-01 jennifer bryant female 25 8319 campamento sol fjohnson@yahoo.com +univ. nacional del comahue técnico para bioterios 2021-02-01 keith richardson male 39 3466 abalo kingjoseph@yahoo.com +univ. nacional del comahue licenciatura en ciencias biológicas 2021-02-01 richard robles male 23 8324 cipolletti kylegraham@hotmail.com +univ. nacional del comahue licenciatura en artes 2021-02-01 stephanie williams female 23 5471 agua blanca jvaldez@hotmail.com +univ. nacional del comahue diseño industrial 2021-02-01 jennifer cohen female 38 4157 arroyo mal paso rramirez@hotmail.com +univ. 
nacional del comahue agronomía 2021-02-01 paul byrd male 23 1746 francisco alvarez sheila73@yahoo.com diff --git a/datasets/GBUNSalvador_process.txt b/datasets/GBUNSalvador_process.txt new file mode 100644 index 00000000..fb023355 --- /dev/null +++ b/datasets/GBUNSalvador_process.txt @@ -0,0 +1,1905 @@ +university career inscription_date first_name last_name gender age postal_code location email +universidad del salvador licenciatura en ciencias de la computación 2020-09-01 carol doyle female 37 3254 colonia la blanquita anthony88@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-01 heidi tran female 27 8514 laguna del barro todd44@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-01 rachael harrington female 23 7243 antonio carboni zcantrell@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-01 ryan silva male 19 5272 comandante leal heather60@gmail.com +universidad del salvador ingeniería mecánica 2020-09-01 tiffany knight female 29 6533 alfredo demarchi bwarner@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-01 tyler ross male 25 2813 arroyo de la cruz martinezstephanie@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-01 caitlyn farrell female 17 9033 aldea apeleg droman@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-01 albert reilly male 35 8409 puerto ojo de agua amysimmons@yahoo.com +universidad del salvador actuario 2020-09-01 kim garza female 23 5753 agua linda lwilson@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-01 donna hicks female 31 8301 planicie banderita kelleyjames@gmail.com +universidad del salvador farmacia 2020-09-01 david nguyen male 23 2240 campo garcia owendawn@yahoo.com +universidad del salvador diseño industrial 2020-09-02 nancy hopkins female 27 2705 haras san jacinto 
tarakoch@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-02 anna williams female 37 6645 la limpia elizabeth50@yahoo.com +universidad del salvador medicina 2020-09-02 darrell villa male 25 5471 agua blanca skim@gmail.com +universidad del salvador ingeniería mecánica 2020-09-02 tammy young female 17 5553 empalme frontera usherman@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-02 rachel miller female 33 8170 abra de hinojo brian17@gmail.com +universidad del salvador ingeniería electrónica 2020-09-02 kristen long female 24 2347 colonia mackinlay beardmelinda@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-02 angela wilson female 27 5261 agua del simbol teresa23@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-02 melanie chan female 25 5621 agua de torre hooverjames@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-02 vincent romero male 39 6723 cucullu vpeterson@hotmail.com +universidad del salvador actuario 2020-09-02 sharon maldonado female 37 7637 la dulce xcalderon@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-02 shawn holt male 27 3060 campo san jose nathan85@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-02 melissa wright female 29 4182 campo la flor los ralos vwilson@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-02 hailey lee female 19 6244 banderalo sextonreginald@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-02 melissa larson female 19 8308 villa manzano bryantshelby@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-02 tiffany fields female 39 1907 el pino frenchbrian@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-09-02 tracy crawford female 17 8111 arroyo pareja josejackson@hotmail.com 
+universidad del salvador licenciatura en ciencias geológicas 2020-09-03 joann howell female 29 6361 agustoni wongcaleb@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-03 lauren frederick female 21 7119 cari larquea colton79@yahoo.com +universidad del salvador ciencias veterinarias 2020-09-03 sandra arroyo female 19 1748 general rodriguez xjohnson@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-03 caroline james female 21 5575 andrade phillipsshirley@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-09-03 christina wilkinson female 23 6501 12 de octubre dunlapmarcus@gmail.com +universidad del salvador licenciatura en sociología 2020-09-03 amy smith female 35 1640 acassuso martinezmichael@hotmail.com +universidad del salvador ciencias veterinarias 2020-09-03 nicole bryan female 25 8400 isla victoria mmiller@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-03 christopher johnson male 39 2456 esmeralda conwaywilliam@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-03 kristen michael female 37 7249 el araza robertnguyen@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-03 michael cole male 17 8172 arroyo corto thompsonjames@hotmail.com +universidad del salvador licenciatura en psicología 2020-09-03 adrian nguyen male 24 5467 acerillos emily62@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-03 james esparza male 29 3309 arroyo tomas benjamin89@hotmail.com +universidad del salvador farmacia 2020-09-03 steven robinson male 19 9420 aserradero arroyo iphillips@yahoo.com +universidad del salvador ingeniería en informática 2020-09-04 joyce faulkner female 18 1909 arana moorechristopher@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-04 dawn flores female 23 2741 el retiro debbie46@yahoo.com 
+universidad del salvador contador público 2020-09-04 kevin kim male 39 6077 encina miranda39@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-04 eric foster male 25 8133 la rosa carolynreyes@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-09-04 shaun harris male 33 2177 bigand smithstephanie@gmail.com +universidad del salvador ingeniería electrónica 2020-09-04 jonathan mccarthy male 17 6537 el camoati sarahmooney@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-04 pamela williams female 29 5409 adan quiroga stevensonjacob@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-04 michael brown male 37 1836 llavallol derrick97@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-04 megan schwartz female 23 2820 colonia el potrero swansongregory@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-04 karen williams female 35 3129 colonia hernandarias teresa05@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-04 jennifer gregory female 27 6231 cuenca johnsondennis@gmail.com +universidad del salvador contador público 2020-09-04 jessica brown female 29 3465 arroyo casco ryanporter@gmail.com +universidad del salvador licenciatura en administración 2020-09-04 brenda hurst female 37 2400 villani justin13@yahoo.com +universidad del salvador actuario 2020-09-04 stacey meyer female 25 7621 la sara ganthony@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-05 samuel parker male 27 2535 el trebol qsims@gmail.com +universidad del salvador ciencias veterinarias 2020-09-05 mason carpenter male 33 5753 agua linda paul92@gmail.com +universidad del salvador arquitectura 2020-09-05 thomas gillespie male 17 3421 bajo guazu gcrawford@hotmail.com +universidad del salvador bioquímica 2020-09-05 kenneth smith male 23 3480 algarrobal 
marvinfuller@gmail.com +universidad del salvador diseño de imagen y sonido 2020-09-05 michael kelly male 17 6559 recalde harrisjeremy@yahoo.com +universidad del salvador farmacia 2020-09-05 caroline moore female 17 5513 barrio jardin luzuriaga jasonthomas@hotmail.com +universidad del salvador licenciatura en artes 2020-09-05 james bradley male 26 6550 bolivar porterdanielle@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-05 jason swanson male 33 7536 estacion coronel pringles christine98@hotmail.com +universidad del salvador diseño industrial 2020-09-05 richard vasquez male 27 4105 abra del tafi davidcourtney@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-05 lindsey green female 21 5547 villa hipodromo lrosales@gmail.com +universidad del salvador ciencias veterinarias 2020-09-05 trevor jackson male 31 5770 chacras viejas angela25@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-05 allison estrada female 27 6511 hale kelly47@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-09-06 samantha hinton female 27 3534 colonia el aguara kleinchristina@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-06 samuel wallace male 33 2148 campo castro ofernandez@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-06 stacy webb female 31 5557 caracoles brianlewis@hotmail.com +universidad del salvador diseño industrial 2020-09-06 donna lane female 17 2639 berabevu gthompson@gmail.com +universidad del salvador medicina 2020-09-06 ryan garza male 17 2760 colonia los tres usaris michael47@yahoo.com +universidad del salvador ciencias veterinarias 2020-09-06 kimberly cardenas female 31 7200 el gualicho xcopeland@yahoo.com +universidad del salvador diseño industrial 2020-09-06 jacqueline adams female 27 6640 asamblea douglasromero@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de 
alimentos 2020-09-06 karen wilson female 17 6475 esteban de luca kristine32@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-06 sharon donaldson female 37 7136 adela scastillo@hotmail.com +universidad del salvador ingeniería electrónica 2020-09-06 steven romero male 33 7407 libano andersondebra@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-06 lisa swanson female 37 2930 la buana moza mrivera@gmail.com +universidad del salvador ingeniería mecánica 2020-09-06 jenna wilson female 29 3372 cataratas del iguazu sarahharris@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-06 matthew griffin male 35 4184 bustamante diazeric@yahoo.com +universidad del salvador actuario 2020-09-07 joseph meadows male 37 1882 ezpeleta este sara20@gmail.com +universidad del salvador ingeniería mecánica 2020-09-07 stephanie hart female 24 5609 aristides villanueva patelsamuel@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-07 james robinson male 20 3162 aranguren robinsonpamela@yahoo.com +universidad del salvador licenciatura en psicología 2020-09-07 carolyn watson female 27 1651 san andres griffinmatthew@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-07 ralph jones male 17 6612 capdepont hensontracy@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-07 john king male 25 6720 kilometro 125 richardmartinez@hotmail.com +universidad del salvador bioquímica 2020-09-07 julie garcia female 26 6712 cortines basserik@gmail.com +universidad del salvador técnico para bioterios 2020-09-07 thomas wood male 37 5501 cerrillos al sud cynthiawolf@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-09-07 thomas flores male 31 3074 colonia el simbol rphillips@gmail.com +universidad del salvador medicina 2020-09-07 carlos richards male 29 6007 arribeños brittany00@gmail.com +universidad del 
salvador licenciatura en gestión de agroalimentos 2020-09-07 kevin freeman male 19 7241 la porteña monicamayo@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-08 robert clark male 20 6317 la florencia anthony05@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-08 tracy castillo male 17 5543 3 de mayo jamesandrade@gmail.com +universidad del salvador ingeniería electrónica 2020-09-08 sharon shepard female 24 1731 villars taylorjames@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-08 cheryl schroeder female 37 2812 capilla del señor emacdonald@yahoo.com +universidad del salvador agronomía 2020-09-08 jesse baldwin male 23 5436 colonia zapata snyderbrian@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-08 olivia peterson female 33 3551 campo monte la viruela brianariley@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-08 alan oneill male 19 2132 aero club rosario eglover@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-08 taylor burns male 18 1986 altamirano miguelwhite@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-08 xavier miller male 39 3158 20 de septiembre jeremyrhodes@yahoo.com +universidad del salvador medicina 2020-09-09 rachel gamble female 33 8371 atreuco reginafranklin@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-09 sean moore male 27 1731 villars thomasolivia@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-09 thomas day male 17 6013 baigorrita maxwilliams@gmail.com +universidad del salvador contador público 2020-09-09 brandi patterson female 25 3423 arañita patrickwright@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-09 gregory johnson male 39 5369 pagancillo carriejohnson@gmail.com +universidad del salvador licenciatura 
en ciencias antropológicas 2020-09-09 jonathan jones male 33 5276 baldes de pacheco waltercombs@yahoo.com +universidad del salvador agronomía 2020-09-09 kimberly gonzalez female 21 8183 avestruz schmidtmaria@hotmail.com +universidad del salvador licenciatura en artes 2020-09-09 todd tucker male 33 4751 agua de dionisio michael85@hotmail.com +universidad del salvador licenciatura en psicología 2020-09-09 timothy thomas male 33 3453 ifran afisher@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-09 adam brown male 17 5750 alto de la leña umyers@yahoo.com +universidad del salvador ingeniería mecánica 2020-09-09 ricky meyer male 24 7135 comandante giribone gordon94@hotmail.com +universidad del salvador licenciatura en sociología 2020-09-09 melissa walker female 17 2147 san genaro norte mward@gmail.com +universidad del salvador diseño industrial 2020-09-09 debra fowler female 37 3448 alamo aaronsmith@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-09 mitchell ellison male 27 3386 caraguatay fgibson@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-09 heather washington female 17 3228 cabi monda campbelljames@hotmail.com +universidad del salvador bioquímica 2020-09-09 sheila wong female 29 3158 20 de septiembre smartin@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-09 anna martinez female 23 3311 arroyo isabel ldunn@gmail.com +universidad del salvador contador público 2020-09-09 katherine medina female 31 2148 campo castro reginald04@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-09-10 latasha smith female 19 1611 don torcuato brett19@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-10 erica bailey female 23 3708 concepcion del bermejo tami08@hotmail.com +universidad del salvador ingeniería en informática 2020-09-10 joshua palmer male 27 7241 la porteña mark21@hotmail.com +universidad del 
salvador diseño industrial 2020-09-10 john oneal male 35 4162 batiruana john08@gmail.com +universidad del salvador licenciatura en administración 2020-09-10 jessica williams female 33 2523 bouquet wagnermaria@yahoo.com +universidad del salvador ingeniería electrónica 2020-09-10 jonathan kennedy male 39 4634 abralaite jamesjackson@hotmail.com +universidad del salvador farmacia 2020-09-10 jonathan lam male 35 3536 bocas latoyagould@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-09-10 tammy sanchez female 21 8168 sierra de la ventana samanthagibson@hotmail.com +universidad del salvador contador público 2020-09-10 justin ward male 33 7547 cascada heather47@yahoo.com +universidad del salvador bioquímica 2020-09-10 janet jenkins female 39 6300 barrancas coloradas patrick54@gmail.com +universidad del salvador técnico para bioterios 2020-09-10 christine conner female 27 6105 cañada seca justinbrown@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-09-10 ronald kennedy male 27 1708 moron khanlisa@gmail.com +universidad del salvador ciencias veterinarias 2020-09-11 veronica white female 31 7303 altona hendersonmegan@hotmail.com +universidad del salvador licenciatura en artes 2020-09-11 ana graves female 23 3421 bajo guazu rosalesclaudia@gmail.com +universidad del salvador ciencias veterinarias 2020-09-11 michael scott male 21 7020 benito juarez williamsonsarah@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-09-11 bryce navarro male 29 6003 ascencion brownsydney@hotmail.com +universidad del salvador licenciatura en administración 2020-09-11 taylor williams male 39 1744 cuartel v nwalls@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-11 angel mosley female 19 9305 cañada de las vacas andrewmartin@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-11 willie solis male 39 1927 esc nav militar rio sant aaron89@hotmail.com 
+universidad del salvador licenciatura en ciencias antropológicas 2020-09-11 david thompson male 18 6389 alegria brianstanton@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-11 jim cox male 29 3315 caa yari oliverevelyn@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-11 diane warren female 35 3371 cabure hedwards@yahoo.com +universidad del salvador ingeniería electrónica 2020-09-11 julie thompson female 37 3476 el remanso thomas62@gmail.com +universidad del salvador farmacia 2020-09-12 kristopher wilkins male 23 3433 carrizal norte hughesrachel@yahoo.com +universidad del salvador actuario 2020-09-12 tina hill female 25 1814 barrio 1 de mayo williamsonwilliam@yahoo.com +universidad del salvador ingeniería en informática 2020-09-12 elizabeth fletcher female 29 3283 colonia mabragaña rclark@yahoo.com +universidad del salvador licenciatura en administración 2020-09-12 miguel williams male 19 4145 ingenio la providencia ccarter@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-12 matthew conley male 19 7249 el araza watsonmelissa@hotmail.com +universidad del salvador licenciatura en artes 2020-09-12 steven bowman male 25 4107 aconquija ykim@gmail.com +universidad del salvador licenciatura en sociología 2020-09-12 george washington male 21 6648 mecha ttaylor@yahoo.com +universidad del salvador agronomía 2020-09-12 natasha edwards female 25 8415 arroyo las minas adamramirez@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-13 marcus payne male 39 5413 apeadero las chimbas ericsullivan@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-13 yolanda harris female 25 3051 alejandra brendahodges@yahoo.com +universidad del salvador medicina 2020-09-13 april joyce female 31 2633 chovet sandra83@yahoo.com +universidad del salvador técnico para bioterios 2020-09-13 jessica vega female 23 
1917 luis chico vwashington@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-13 jason shea male 35 3216 arroyo hondo ronalddean@gmail.com +universidad del salvador licenciatura en sociología 2020-09-13 frank weaver male 33 6051 ingeniero balbin vickiewood@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-13 michele tucker female 21 5276 baldes de pacheco adavis@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-14 andrew le male 33 3423 arañita dorothy42@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-14 jacob goodwin male 25 7631 costa bonita balneario timothy92@gmail.com +universidad del salvador agronomía 2020-09-14 michael munoz male 23 4234 achalco whitney22@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-14 kimberly floyd female 23 2840 albardon paulburch@gmail.com +universidad del salvador ingeniería mecánica 2020-09-14 terri oneal female 35 5624 kilometro 47 wandamiller@gmail.com +universidad del salvador arquitectura 2020-09-14 julie murray female 25 6603 ingeniero williams swilson@yahoo.com +universidad del salvador ingeniería en informática 2020-09-14 nicholas alvarez male 37 8307 colonia gobernador ayala sarah42@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-14 collin stewart male 29 3621 pozo navagan cassiejohnson@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-14 william bell male 23 6663 juan vela nicole13@hotmail.com +universidad del salvador bioquímica 2020-09-14 charles hayden male 25 4506 alegria jody40@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-14 tiffany brown female 19 7313 16 de julio charlesjames@gmail.com +universidad del salvador licenciatura en ciencia política 2020-09-14 john wells male 27 9023 buen pasto jason46@gmail.com +universidad del salvador ingeniería 
mecánica 2020-09-15 heather thomas female 33 4518 aguas calientes josephcoleman@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-15 erica perez female 37 1633 empalme hrichardson@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-15 peter dunn male 24 2181 los molinos ngarrett@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-15 becky mckee female 39 2508 armstrong anthonylopez@hotmail.com +universidad del salvador licenciatura en administración 2020-09-15 timothy brown male 25 3503 barranqueras logan69@gmail.com +universidad del salvador licenciatura en psicología 2020-09-15 kim carter female 35 2453 carlos pellegrini josephgill@hotmail.com +universidad del salvador medicina 2020-09-15 jason fisher male 25 3017 bajo las tunas stoutlarry@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-15 laura mahoney female 21 2743 arroyo dulce ybraun@yahoo.com +universidad del salvador licenciatura en psicología 2020-09-15 andrew osborne male 26 2307 ataliva hmcclain@yahoo.com +universidad del salvador licenciatura en administración 2020-09-15 christopher bass male 21 2919 copacabana jerryhess@yahoo.com +universidad del salvador ingeniería mecánica 2020-09-15 renee cox female 26 3125 antonio tomas rbaker@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-15 anna clark female 23 6317 la florencia smithbrian@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-15 penny huang female 37 6369 campo salusso robert89@hotmail.com +universidad del salvador licenciatura en sociología 2020-09-15 sydney english female 29 2456 esmeralda jerryarmstrong@yahoo.com +universidad del salvador contador público 2020-09-15 robert johnson male 23 6663 juan vela brownjane@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-15 james singh male 23 6703 
alastuey pcooper@gmail.com +universidad del salvador contador público 2020-09-15 brandon thompson male 17 5549 agua de los manantiales farroyo@hotmail.com +universidad del salvador técnico para bioterios 2020-09-16 katherine baker female 22 3194 paso telegrafo angelasmith@gmail.com +universidad del salvador diseño de imagen y sonido 2020-09-16 rebecca johnson female 39 6230 francisco casal jenna90@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-16 jacob norris male 25 6535 bellocq nicolenelson@yahoo.com +universidad del salvador ingeniería mecánica 2020-09-16 yvonne fisher female 27 3340 boqueron parkerandrew@yahoo.com +universidad del salvador ingeniería en informática 2020-09-16 kim taylor female 33 8363 colonia josefa traciromero@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-09-16 jacqueline hernandez female 23 3317 arroyo magdalena dannymartin@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-16 john oliver male 19 6472 francisco madero kevinperez@hotmail.com +universidad del salvador agronomía 2020-09-16 gloria cooper female 25 7408 la colina handerson@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-16 christina parsons female 26 2000 villa angelica pamelalawson@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-16 dustin burton male 35 6700 caminera lujan elizabeth75@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-16 tammy bryant female 17 8379 gente grande bradshawcourtney@gmail.com +universidad del salvador licenciatura en sociología 2020-09-16 james barrett male 27 5261 agua del simbol hogankarl@hotmail.com +universidad del salvador ingeniería mecánica 2020-09-16 michael meyer male 35 1682 martin coronado alyssastafford@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-16 jennifer collins female 21 3188 
colonia falco wmorrow@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-17 anthony miller male 21 6501 12 de octubre ejennings@yahoo.com +universidad del salvador contador público 2020-09-17 jennifer jimenez female 27 2631 cora tbailey@yahoo.com +universidad del salvador medicina 2020-09-17 nicholas case male 17 7637 la dulce xnorris@gmail.com +universidad del salvador ingeniería electrónica 2020-09-17 samuel brooks male 21 1834 temperley hannahwilliams@gmail.com +universidad del salvador ingeniería electrónica 2020-09-17 lori roberts female 20 6623 indacochea murraydoris@hotmail.com +universidad del salvador ciencias veterinarias 2020-09-17 joshua friedman male 25 1665 jose clemente paz vsmith@hotmail.com +universidad del salvador ciencias veterinarias 2020-09-17 david evans male 29 9041 los antiguos davidflores@yahoo.com +universidad del salvador licenciatura en administración 2020-09-17 jessica green female 21 6469 asturias hcrawford@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-17 gabriela weiss female 33 1670 nordelta stonecatherine@yahoo.com +universidad del salvador licenciatura en administración 2020-09-17 james gonzalez male 21 2747 coronel isleños josephjackson@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-17 taylor saunders female 31 7316 fortin irene amanda64@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-17 raymond wilkinson male 37 8126 aldea san andres christopher41@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-09-17 brandon keller male 39 2828 colonia nueva montevideo masonmatthew@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-17 kathy soto female 19 6441 colonia baron hirsch randallrogers@yahoo.com +universidad del salvador agronomía 2020-09-17 andrea jackson female 23 2821 arroyo del cura robertsjose@hotmail.com +universidad del salvador 
licenciatura en ciencia y tecnología de alimentos 2020-09-18 tristan gonzales male 24 6312 ricardo lavalle natasharodriguez@gmail.com +universidad del salvador farmacia 2020-09-18 earl martinez male 19 4178 abra rica william80@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-18 brenda benson female 23 7100 dolores jeff02@gmail.com +universidad del salvador medicina 2020-09-18 breanna wells female 27 3363 25 de mayo josephthompson@yahoo.com +universidad del salvador ingeniería mecánica 2020-09-18 michelle evans female 17 3363 25 de mayo phughes@hotmail.com +universidad del salvador ingeniería mecánica 2020-09-18 justin miller male 31 2177 bigand molinajames@hotmail.com +universidad del salvador actuario 2020-09-18 david michael male 23 7407 libano fosterjames@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-18 tanya maynard female 31 3474 chavarria whitejoel@yahoo.com +universidad del salvador licenciatura en artes 2020-09-18 stanley thomas male 19 3441 algarrobo sancheznicholas@yahoo.com +universidad del salvador actuario 2020-09-18 jacqueline lynch female 37 2177 bigand keith17@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-18 lori sanchez female 23 7003 aceilan gbrown@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-18 gregory patel male 19 9301 el chalten robertmatthews@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-18 william rollins male 31 4643 antiguyos ariaspatricia@hotmail.com +universidad del salvador licenciatura en artes 2020-09-18 melissa christian female 39 2751 almacen castro smithjeffrey@hotmail.com +universidad del salvador licenciatura en administración 2020-09-18 jeremiah hernandez male 29 7501 indio rico william27@gmail.com +universidad del salvador diseño industrial 2020-09-18 debra zhang female 29 5600 agua de la mula jennifer21@yahoo.com +universidad del salvador 
licenciatura en gestión de agroalimentos 2020-09-18 heather davidson female 17 5509 agrelo thuang@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-19 richard reese male 39 5707 aguaditas sawyerkimberly@hotmail.com +universidad del salvador licenciatura en administración 2020-09-19 jose jackson male 24 5509 agrelo miguelmorgan@yahoo.com +universidad del salvador licenciatura en artes 2020-09-19 melissa rodriguez female 25 5367 cachiyuyal darlenehenry@gmail.com +universidad del salvador diseño de imagen y sonido 2020-09-19 sarah gallagher female 25 3204 ayui parada edwardhendricks@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-19 james thomas male 37 3016 san jose lynchscott@yahoo.com +universidad del salvador ingeniería en informática 2020-09-19 matthew bass male 39 3180 diego lopez jeffreymanning@yahoo.com +universidad del salvador contador público 2020-09-19 james carter male 25 7150 ayacucho pvaldez@hotmail.com +universidad del salvador diseño industrial 2020-09-19 stephanie hays female 27 1755 rafael castillo sawyerrobin@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-19 michael peterson male 35 6244 banderalo andrewbarton@yahoo.com +universidad del salvador licenciatura en administración 2020-09-19 tara powell female 17 3526 gandolfi chelsea78@hotmail.com +universidad del salvador agronomía 2020-09-20 geoffrey shea male 25 3569 barros pazos millermonica@gmail.com +universidad del salvador ingeniería mecánica 2020-09-20 erik patterson male 21 3340 boqueron fisherphillip@hotmail.com +universidad del salvador farmacia 2020-09-20 james shields male 39 2709 los indios nproctor@hotmail.com +universidad del salvador contador público 2020-09-20 mark shaw male 27 3328 colonia japonesa erin47@yahoo.com +universidad del salvador contador público 2020-09-20 jorge gomez male 27 5551 estacion uspallata barbaramartinez@hotmail.com +universidad del salvador 
licenciatura en ciencia política 2020-09-20 joseph franklin male 35 2132 aero club rosario michellepreston@yahoo.com +universidad del salvador ciencias veterinarias 2020-09-20 justin pacheco male 29 5425 albarracin wilsonjennifer@gmail.com +universidad del salvador licenciatura en administración 2020-09-20 shawna watkins female 26 3234 bonpland jessestevenson@hotmail.com +universidad del salvador ingeniería electrónica 2020-09-20 christopher garcia male 39 5622 colonia jauregui donna62@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-20 elizabeth moreno female 25 5460 agua de la zorra taylorlori@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-20 michael vasquez male 25 4723 alijilan jamesray@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-20 james campbell male 19 1900 la plata nburch@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-09-20 deborah reid female 25 6743 coliqueo xgriffin@gmail.com +universidad del salvador técnico para bioterios 2020-09-20 michael griffin male 17 7119 cari larquea sbrady@hotmail.com +universidad del salvador licenciatura en administración 2020-09-20 john johnson male 37 3229 colonia freitas btaylor@yahoo.com +universidad del salvador licenciatura en sociología 2020-09-20 edwin jackson male 17 3306 centinela andersonnatalie@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-20 kathryn turner female 25 9051 aguada a pique dvillegas@yahoo.com +universidad del salvador bioquímica 2020-09-20 jennifer hawkins female 31 1834 temperley mary45@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-20 kelly taylor female 39 2713 manuel ocampo randallweber@gmail.com +universidad del salvador arquitectura 2020-09-20 mallory villarreal female 17 3302 aguara cua porterdave@yahoo.com +universidad del salvador ingeniería en 
informática 2020-09-21 brian morrison male 27 5750 alto de la leña patrick64@gmail.com +universidad del salvador actuario 2020-09-21 elizabeth navarro female 31 3231 colonia arocena ina dwest@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-21 elijah oneill male 27 5596 12 de octubre loganrobertson@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-21 jason johnson male 25 6338 leubuco steven06@gmail.com +universidad del salvador contador público 2020-09-21 nicole tyler female 37 1621 benavidez amycontreras@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-21 cheyenne solomon female 33 3381 maria magdalena zramirez@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-21 hector sherman male 23 3328 colonia japonesa ebailey@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-21 james harvey male 25 6013 baigorrita fergusonbrandon@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-09-21 kimberly lane female 27 4155 cevil grande dickersonjames@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-21 jessica adams female 31 4751 agua de dionisio ericmonroe@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-21 maria evans female 24 2520 la california jennifer35@hotmail.com +universidad del salvador ciencias veterinarias 2020-09-22 michelle walsh female 23 8172 arroyo corto jessicanewman@hotmail.com +universidad del salvador diseño industrial 2020-09-22 russell roberts male 37 5883 alto lindo debra58@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-22 sherri thomas female 21 4753 corralito marklynch@gmail.com +universidad del salvador ciencias veterinarias 2020-09-22 jessica james female 37 2138 carcaraña vincentjoel@yahoo.com +universidad del salvador licenciatura en 
planificación y diseño del paisaje 2020-09-22 kristin baxter female 25 2317 casablanca qhanson@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-23 elijah murphy male 21 3280 arroyo urquiza dmiller@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-23 michael williams male 25 7313 16 de julio ihickman@gmail.com +universidad del salvador farmacia 2020-09-23 john owens male 25 5565 campo de los andes echristian@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-23 bethany mccall female 21 5719 agua amarga howarddenise@yahoo.com +universidad del salvador ingeniería electrónica 2020-09-23 benjamin parker male 25 9050 gobernador moyano dominguezkristina@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-23 tamara carrillo female 27 8375 cañadon de los indios kyoung@hotmail.com +universidad del salvador licenciatura en artes 2020-09-23 lisa malone female 39 9103 bajo de los huesos zbrown@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-09-23 gregory collins male 25 4145 ingenio la providencia haleykevin@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-23 tracy miller female 35 8185 campo del norte americano christinemccoy@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-23 janet gomez female 23 1862 america unida cheryl42@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-23 karen moore female 27 6385 arata zsmith@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-23 martin cobb male 27 5710 la punta rebeccagordon@hotmail.com +universidad del salvador licenciatura en administración 2020-09-23 william fowler male 27 3557 caraguatay georgemiles@hotmail.com +universidad del salvador actuario 2020-09-23 michael ortega male 39 1605 carapachay wrightlisa@hotmail.com 
+universidad del salvador licenciatura en ciencia política 2020-09-23 rodney wilkerson male 31 3371 cabure johncannon@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-24 tara mcgee female 31 3476 el remanso ggarcia@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-24 kevin austin male 37 3412 albardon evan49@gmail.com +universidad del salvador licenciatura en administración 2020-09-24 deanna sanchez female 29 8144 colonia monte la plata qmartinez@gmail.com +universidad del salvador farmacia 2020-09-24 jeffrey miller male 19 6058 pazos kanki rachel07@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-24 gina thomas female 33 1768 ciudad madero rogersmatthew@gmail.com +universidad del salvador licenciatura en psicología 2020-09-24 brent weeks male 25 5421 la tranca debbieayala@yahoo.com +universidad del salvador farmacia 2020-09-24 rickey griffith male 23 8418 anecon chico kmay@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-09-24 andrea reid female 31 1905 jose ferrari johnrichards@gmail.com +universidad del salvador arquitectura 2020-09-24 karl kelly male 26 1822 valentin alsina garymoore@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-09-24 vickie williams female 29 6062 coronel granada meganferguson@gmail.com +universidad del salvador agronomía 2020-09-24 kimberly davila female 27 3515 capitan solari williamskara@hotmail.com +universidad del salvador arquitectura 2020-09-24 kevin burton male 39 6015 campo coliqueo owolfe@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-09-24 james burns male 23 2119 arminda walvarado@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-24 grace velasquez female 26 3302 aguara cua gallegosjim@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-24 francis glover male 33 6214 casimiro gomez 
mooresteven@yahoo.com +universidad del salvador licenciatura en artes 2020-09-24 christine reed female 22 4117 alabama nancy29@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-09-24 robert weaver male 23 6389 alegria rileykaren@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-24 ryan landry male 39 6705 villa ruiz qperkins@hotmail.com +universidad del salvador actuario 2020-09-24 lee reed male 25 1919 base aeronaval punta indio frank33@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-25 william fry male 37 3216 arroyo hondo rebecca24@hotmail.com +universidad del salvador bioquímica 2020-09-25 tracy carey female 25 6725 carmen de areco romanlee@gmail.com +universidad del salvador ciencias veterinarias 2020-09-25 tiffany stevens female 21 7500 el carretero urussell@gmail.com +universidad del salvador farmacia 2020-09-25 rebecca johnson female 35 6311 campo de los toros marshallanthony@hotmail.com +universidad del salvador farmacia 2020-09-25 jasmine johnston female 21 3061 antonio pini jennifer65@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-25 jennifer hudson female 18 3050 calchaqui andre87@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-09-25 ian goodman male 35 2812 capilla del señor jessica98@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-25 joyce campbell female 19 2609 colonia morgan dianedominguez@gmail.com +universidad del salvador ciencias veterinarias 2020-09-25 craig morgan male 26 1655 jose leon suarez jacqueline43@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-25 karen hamilton female 18 5871 la aguada de las animas timothyberry@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-25 james bradley male 33 1731 villars matthew74@yahoo.com +universidad del salvador licenciatura en planificación 
y diseño del paisaje 2020-09-26 james roy male 35 7515 claudio c molina jacobsmith@gmail.com +universidad del salvador ingeniería electrónica 2020-09-26 daniel mullins male 17 9217 cholila troycharles@hotmail.com +universidad del salvador medicina 2020-09-26 kelsey brown female 37 2802 lomas del rio lujan avilajoseph@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-26 charles alvarado male 25 1881 san francisco solano qparsons@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-26 jessica johns female 39 6311 campo de los toros kmullins@hotmail.com +universidad del salvador agronomía 2020-09-26 carol morton female 29 4152 aguilares lawsonleslie@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-26 teresa rowland female 26 6230 francisco casal rmorgan@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-09-26 rachel jackson female 25 2637 colonia hansen saragardner@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-26 joshua richards male 21 8532 arroyo salado osherman@gmail.com +universidad del salvador contador público 2020-09-26 holly sanchez female 35 5300 amilgancho patrick50@yahoo.com +universidad del salvador medicina 2020-09-26 victoria crawford female 39 2216 campo raffo angela58@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-26 heather richardson female 24 9311 cañadon leon pamelamayer@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-27 jesus rowe male 25 3027 la pelada mcooper@hotmail.com +universidad del salvador agronomía 2020-09-27 christian ross male 35 1847 rafael calzada tracie62@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-09-27 joseph baldwin male 21 9221 valle hondo harringtonjordan@hotmail.com +universidad del salvador licenciatura en administración 2020-09-27 cynthia lee female 23 
7260 barrio villa saladillo castrojamie@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-27 david garcia male 23 3485 carandaiti lisaroach@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-09-27 stephen woodard male 21 7212 doctor domingo harosteguy floreschristopher@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-27 christina boone female 19 1802 aeropuerto ezeiza bettymckay@hotmail.com +universidad del salvador licenciatura en psicología 2020-09-27 christopher madden male 25 5555 puente del inca nicholasmontgomery@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-27 bobby lopez male 21 1814 barrio 1 de mayo andersonstephanie@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-27 jennifer sharp female 33 3363 25 de mayo onealnicole@gmail.com +universidad del salvador actuario 2020-09-27 melissa ward female 39 3164 colonia rivas whitakerkatherine@hotmail.com +universidad del salvador arquitectura 2020-09-27 haley williams female 39 8508 ambrosio p lezica mcguirekaren@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-28 courtney bailey female 37 4178 abra rica joseph58@hotmail.com +universidad del salvador bioquímica 2020-09-28 john harris male 21 6535 bellocq bryancarmen@gmail.com +universidad del salvador actuario 2020-09-28 brian rojas male 24 8203 la chirlandia sharonmccarty@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-28 jonathan ochoa male 26 1774 la salada christymoody@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-28 claire lucas female 21 4751 agua de dionisio woodslisa@hotmail.com +universidad del salvador contador público 2020-09-28 william cunningham male 19 8424 aguada de guerra nicole75@gmail.com +universidad del salvador medicina 2020-09-28 daniel reid male 35 2718 lierra adjemiro 
ygonzalez@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-28 daniel evans male 21 7307 crotto maxwellteresa@hotmail.com +universidad del salvador ingeniería electrónica 2020-09-28 tammy king female 24 7241 la porteña carrillomary@yahoo.com +universidad del salvador licenciatura en psicología 2020-09-28 andrew sullivan male 29 5715 arbol verde kimberlyschneider@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-28 eric hernandez male 25 3081 cavour chickman@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-09-28 stephanie richardson female 29 3338 17 de agosto julialopez@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-09-28 christine rubio female 29 3216 arroyo hondo jasonrobinson@gmail.com +universidad del salvador ingeniería electrónica 2020-09-29 matthew bolton male 21 8328 allen thomasobrien@yahoo.com +universidad del salvador licenciatura en artes 2020-09-29 daisy tyler female 27 2322 cabaña el cisne rodney66@gmail.com +universidad del salvador licenciatura en sociología 2020-09-29 michelle wade female 25 6703 alastuey klewis@gmail.com +universidad del salvador diseño industrial 2020-09-29 michael dominguez male 27 4234 achalco donnaperez@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-29 traci juarez female 29 4634 abralaite grimescynthia@gmail.com +universidad del salvador ingeniería en informática 2020-09-29 brittney sparks female 33 4651 agua de castilla ericabowers@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-09-29 valerie maynard female 29 9421 frigorifico cap fowlererik@yahoo.com +universidad del salvador ingeniería en informática 2020-09-29 brittney cole female 37 7135 comandante giribone jamesmayer@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-09-29 monica farley female 17 2105 cañada rica maria48@yahoo.com 
+universidad del salvador licenciatura en relaciones del trabajo 2020-09-29 john flores male 27 8353 aguada chacay co churchmiguel@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-09-29 kevin boyle male 24 9039 hito 45 nbradford@hotmail.com +universidad del salvador ingeniería electrónica 2020-09-29 carl washington male 35 5703 6 de septiembre foxmichael@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-09-29 todd frazier male 27 5582 alberto flores amyneal@gmail.com +universidad del salvador técnico para bioterios 2020-09-29 tracy montgomery female 25 2909 estancias keithhernandez@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-09-29 lori anderson female 39 7403 alvaro barros rachelreynolds@hotmail.com +universidad del salvador actuario 2020-09-30 jennifer zuniga female 17 5474 barranquitas vincentlaura@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-09-30 jessica wilson female 17 6062 coronel granada gpage@yahoo.com +universidad del salvador contador público 2020-09-30 ronnie sanders male 31 7207 el trigo karayates@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-09-30 yvonne johnson female 19 7020 benito juarez mcdonaldaaron@gmail.com +universidad del salvador contador público 2020-09-30 hannah hall female 39 5569 aguada heather32@gmail.com +universidad del salvador agronomía 2020-09-30 jennifer ray female 37 6034 colonia alberdi david54@yahoo.com +universidad del salvador técnico para bioterios 2020-09-30 meghan smith female 33 2505 campo la riviere rtaylor@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-09-30 dale patel male 19 2707 4 de noviembre eduke@hotmail.com +universidad del salvador licenciatura en psicología 2020-09-30 daniel cohen male 35 2305 lehmann franksmith@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-01 ryan carlson male 25 2705 haras san jacinto 
jromero@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-01 grant ruiz male 17 9013 cañadon seco weaverbarbara@gmail.com +universidad del salvador licenciatura en psicología 2020-10-01 erica nelson female 17 4149 alpachiri anthony24@yahoo.com +universidad del salvador licenciatura en administración 2020-10-01 karen gamble female 33 2173 campo pesoa stephanieberry@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-01 christopher russell male 17 6535 bellocq pattersonjeremy@gmail.com +universidad del salvador licenciatura en artes 2020-10-01 anthony kennedy male 18 2204 jesus maria alexandra42@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-01 jeffrey smith male 39 3014 angel gallardo ztaylor@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-01 laura riddle female 17 6475 esteban de luca joshuarivera@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-01 madeline carson female 24 6348 bocayuba christopher85@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-10-01 anna lowe female 18 8349 aguas de las mulas ohunt@yahoo.com +universidad del salvador diseño industrial 2020-10-01 angela nguyen female 29 8532 arroyo salado megan93@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-01 joshua spears male 37 6077 encina psanders@hotmail.com +universidad del salvador licenciatura en sociología 2020-10-01 regina briggs female 23 9200 arroyo pescado katelyn31@gmail.com +universidad del salvador actuario 2020-10-01 david brown male 24 6032 blandengues carterkeith@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-01 jessica santiago female 29 4149 alpachiri dawn33@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-02 melissa ross female 31 3705 10 de mayo william11@gmail.com +universidad del salvador licenciatura en 
psicología 2020-10-02 heather williams female 37 4147 alto las lechuzas cherylchan@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-02 kevin harmon male 27 6317 la florencia bishoppatrick@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-02 christina gutierrez female 22 4184 bustamante smithmelanie@hotmail.com +universidad del salvador contador público 2020-10-02 gary hays male 23 5473 aguayo danielmendoza@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-02 kristi cherry female 37 1875 wilde zrivera@gmail.com +universidad del salvador agronomía 2020-10-02 stephanie martin female 25 2340 ceres nsanchez@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-02 andrew mullins male 21 3555 campo huber millerluis@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-02 craig austin male 25 9033 aldea apeleg hernandezrebecca@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-02 justin howell male 35 5771 alanices crystaltaylor@gmail.com +universidad del salvador licenciatura en administración 2020-10-02 heather miller female 19 3328 colonia japonesa courtneygonzalez@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-02 dustin wilson male 35 1875 wilde kfrye@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-02 wesley horne male 29 3536 bocas xarcher@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-02 matthew moody male 23 2637 colonia hansen gonzalezkelsey@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-03 katie saunders female 29 2806 las palmas ofreeman@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-10-03 nicole stewart female 26 5359 alto jaguel collinspaul@gmail.com +universidad del salvador bioquímica 2020-10-03 timothy townsend male 23 2453 carlos 
pellegrini john38@gmail.com +universidad del salvador ciencias veterinarias 2020-10-03 brian reynolds male 19 5401 barrio el tontal matthewadams@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-03 marie mason female 33 6305 atreuco danielflowers@yahoo.com +universidad del salvador medicina 2020-10-03 ryan reyes male 23 4195 7 de abril andradeapril@gmail.com +universidad del salvador ingeniería mecánica 2020-10-03 sarah roach female 35 8431 el hoyo haroldadams@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-03 joseph clark male 33 7103 faro san antonio mooremark@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-03 kevin carpenter male 31 4651 agua de castilla lopezcatherine@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-04 rebecca berry female 27 1895 arturo segui bhamilton@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-04 benjamin petersen male 17 4724 agua colorada jeffreyyoung@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-04 jean kelly female 33 8308 villa manzano qlewis@yahoo.com +universidad del salvador ingeniería en informática 2020-10-04 steven martin male 19 9105 angostura benjaminanderson@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-04 allison riley female 37 2000 villa angelica amy77@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-04 anthony king male 21 1905 jose ferrari jshelton@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-04 joseph kent male 39 2113 peyrano brandonmccormick@hotmail.com +universidad del salvador diseño industrial 2020-10-04 natasha matthews female 31 2903 erezcano changstephanie@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-04 joshua perez male 39 7639 
cooper tchristian@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-04 tony johnson male 25 2705 haras san jacinto garciavincent@yahoo.com +universidad del salvador actuario 2020-10-04 robin grant female 23 9020 arroyo quilla charlesedwards@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-04 robert hernandez male 18 5594 alto con zampa wrightleonard@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-04 john gray male 26 1631 villa rosa boonepreston@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-05 ashley brown female 19 2637 colonia hansen robertsrobert@yahoo.com +universidad del salvador agronomía 2020-10-05 pamela phillips female 37 4700 banda varela mpope@gmail.com +universidad del salvador ingeniería mecánica 2020-10-05 jonathan orozco male 19 3405 algarrobal puisoye nicole35@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-05 sean davis male 26 4149 alpachiri jelliott@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-05 jose hicks male 21 7403 alvaro barros andersonandrew@yahoo.com +universidad del salvador ingeniería mecánica 2020-10-05 tom rose male 29 6237 america elizabethwoods@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-05 lisa gonzalez female 25 5415 angaco norte millerjonathon@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-05 roberto black male 35 1913 atalaya djackson@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-05 shannon jones female 21 2942 baradero johnsonanthony@yahoo.com +universidad del salvador licenciatura en administración 2020-10-05 michael gonzalez male 33 3240 colonia egido atkinsoncharles@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-05 victor 
white male 33 8364 chimpay campbellashley@yahoo.com +universidad del salvador ingeniería en informática 2020-10-05 patrick jackson male 23 2132 aero club rosario deanna37@yahoo.com +universidad del salvador técnico para bioterios 2020-10-05 joseph mcguire male 39 7318 colonia hinojo dawn77@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-06 emma ball female 25 1806 tristan suarez zbuckley@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-10-06 courtney kirk female 23 2142 campo medina mbrewer@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-06 amy wallace female 23 3372 cataratas del iguazu davidhess@hotmail.com +universidad del salvador licenciatura en artes 2020-10-06 noah harris male 25 3218 arroyo palmar osummers@gmail.com +universidad del salvador licenciatura en administración 2020-10-06 brenda walker female 35 3285 berduc shepherdcarl@gmail.com +universidad del salvador ingeniería en informática 2020-10-06 chad booker male 26 5525 buena vista jennifersanchez@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-07 debbie holden female 25 5883 alto lindo turnerpamela@gmail.com +universidad del salvador técnico para bioterios 2020-10-07 sherry gonzalez female 33 3445 9 de julio afleming@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-07 mary perez female 18 4741 agua de las palomas virginiaroberts@hotmail.com +universidad del salvador ciencias veterinarias 2020-10-07 kylie reyes female 19 8333 aguada guzman christopherrivera@gmail.com +universidad del salvador ingeniería en informática 2020-10-07 jesse rodriguez male 23 2613 la morocha urangel@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-07 susan fuller female 19 5571 chivilcoy regina66@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-07 anthony garner male 31 7519 san 
mayol josephdavis@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-07 hector garza male 39 1646 san fernando tracymorales@yahoo.com +universidad del salvador diseño industrial 2020-10-07 andrew beltran male 31 8206 colonia españa barbaraortiz@hotmail.com +universidad del salvador licenciatura en artes 2020-10-07 john romero male 21 7160 la union sbarber@yahoo.com +universidad del salvador ciencias veterinarias 2020-10-07 angelica hoffman female 19 8409 puerto ojo de agua mboyd@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-07 maureen long female 25 3466 abalo nathaniel42@hotmail.com +universidad del salvador licenciatura en psicología 2020-10-08 sheri quinn female 24 7519 san mayol derek21@gmail.com +universidad del salvador contador público 2020-10-08 matthew cole male 27 3565 arroyo del rey thomascynthia@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-08 pamela mann female 26 3530 aldea forestal camposamber@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-08 steven hardy male 25 7208 coronel boerr darrelljimenez@yahoo.com +universidad del salvador ingeniería en informática 2020-10-08 dwayne dennis male 29 3260 arroyo molino robertsonmorgan@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-08 brian foley male 25 3170 alberto gerchunoff traci74@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-08 shawn richardson male 20 8503 chocori ramirezgina@yahoo.com +universidad del salvador arquitectura 2020-10-08 curtis nguyen male 19 2301 bella italia jacksoncrystal@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-08 susan leblanc female 27 5425 albarracin mmorales@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-08 james martin male 25 1931 punta lara janice49@gmail.com +universidad del salvador licenciatura 
en kinesiología y fisiatría 2020-10-08 taylor mcmahon female 23 3016 san jose jonesjenna@hotmail.com +universidad del salvador ciencias veterinarias 2020-10-09 jacob hickman male 21 7228 abbott andersonmelissa@gmail.com +universidad del salvador medicina 2020-10-09 jacob thomas male 37 4724 agua colorada paul06@gmail.com +universidad del salvador contador público 2020-10-09 jessica jones female 31 3280 arroyo urquiza mcbridejohn@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-09 jennifer beck female 23 7107 santa teresita hatfieldjohnathan@gmail.com +universidad del salvador licenciatura en ciencia política 2020-10-09 lisa foster female 29 6660 25 de mayo ipotter@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-10 david mason male 33 2326 bealistock gabrielle52@gmail.com +universidad del salvador licenciatura en administración 2020-10-10 tyler kerr male 31 3076 huanqueros colemelissa@gmail.com +universidad del salvador agronomía 2020-10-10 william rogers male 21 3372 cataratas del iguazu blake61@yahoo.com +universidad del salvador ciencias veterinarias 2020-10-10 brandon jones male 29 1894 juan vucetich ex dr r levene ismith@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-10 justin gardner male 31 3446 kilometro 374 abrown@gmail.com +universidad del salvador licenciatura en sociología 2020-10-10 steven scott male 23 5351 banda florida youngshelby@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-10 thomas wilson male 35 7313 16 de julio jodysmith@hotmail.com +universidad del salvador farmacia 2020-10-10 amber smith female 33 6361 agustoni steelejohn@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-10 marc morrow male 17 1832 lomas de zamora karina37@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-10-10 carl baldwin male 23 8319 campamento sol robertvaldez@gmail.com 
+universidad del salvador licenciatura en ciencias de la educación 2020-10-10 dennis simpson male 22 8144 colonia monte la plata ingramdonald@gmail.com +universidad del salvador actuario 2020-10-10 robin rowland female 33 3177 altamirano norte ashleybrown@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-11 richard jones male 29 2630 firmat teresa84@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-11 anthony watkins male 25 5521 los corredores dmurray@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-11 daniel hernandez male 39 3474 chavarria jimchavez@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-11 dawn saunders female 33 5341 anillaco christopher56@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-11 michael spencer male 17 7130 caminera samborombon jack76@gmail.com +universidad del salvador arquitectura 2020-10-11 michael lamb male 31 1737 kilometro 77 rachel86@hotmail.com +universidad del salvador farmacia 2020-10-11 paul thomas male 31 7020 benito juarez ndeleon@hotmail.com +universidad del salvador técnico para bioterios 2020-10-11 tara collins female 31 1852 burzaco oflores@yahoo.com +universidad del salvador licenciatura en psicología 2020-10-11 brian howard male 33 3234 bonpland sue21@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-11 andrew sullivan male 17 1746 francisco alvarez omarvasquez@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-11 hayden jennings male 21 3054 colonia la negra juliajohnson@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-11 steven keith male 33 2931 isla los laureles patricia80@yahoo.com +universidad del salvador actuario 2020-10-11 julia webb female 37 2946 el espinillo dlee@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-11 jeffrey houston male 
35 3214 estacion yerua deborah60@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-11 james dougherty male 19 5523 buena nueva dennisconway@yahoo.com +universidad del salvador técnico para bioterios 2020-10-11 zachary brown male 37 8117 alferez san martin travishouston@yahoo.com +universidad del salvador farmacia 2020-10-11 kimberly diaz female 19 8417 cañadon chileno david99@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-12 bonnie mathews female 27 6333 alfredo peña curtisparker@yahoo.com +universidad del salvador ingeniería en informática 2020-10-12 rachael richardson female 31 5557 caracoles walkerjames@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-12 ricky reese male 31 5531 barrio ferri hashley@gmail.com +universidad del salvador licenciatura en psicología 2020-10-12 ann alvarez female 19 7603 comandante nicanor otamendi khanlisa@gmail.com +universidad del salvador ingeniería en informática 2020-10-12 ricky delgado male 26 1763 virrey del pino justinchavez@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-12 jason meyer male 37 1849 claypole clewis@hotmail.com +universidad del salvador licenciatura en artes 2020-10-12 timothy johnston male 23 1911 bme bavio gral mansilla ryan49@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-12 katherine bond female 19 6608 agote iandrade@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-12 howard andrade male 37 2813 arroyo de la cruz markhill@gmail.com +universidad del salvador farmacia 2020-10-12 tiffany ellis female 27 3046 arrascaeta rogerslisa@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-12 ricky king male 25 8353 aguada chacay co paynesarah@gmail.com +universidad del salvador licenciatura en administración 2020-10-12 sean miller male 19 7220 funke 
russellbryan@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-12 kimberly brown female 25 4129 cañada xhahn@hotmail.com +universidad del salvador agronomía 2020-10-12 michael thompson male 24 3382 colonia cunci qjohnson@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-12 kenneth lynn male 18 5383 agua colorada theresamunoz@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-12 brian buckley male 24 2607 campo quirno browningchristopher@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-12 timothy graves male 17 4158 campo de talamayo terri10@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-13 logan thomas male 33 3472 caaguazu pclark@yahoo.com +universidad del salvador contador público 2020-10-13 brian charles male 21 4122 alizal vthomas@gmail.com +universidad del salvador ingeniería mecánica 2020-10-13 kimberly wiggins female 27 3569 barros pazos andrewrandolph@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-13 gina stevens female 19 2324 colonia tacurales jasmine29@hotmail.com +universidad del salvador licenciatura en administración 2020-10-13 edwin esparza male 19 7633 maori qfarmer@hotmail.com +universidad del salvador licenciatura en artes 2020-10-13 william barajas male 39 3569 barros pazos randyoneill@gmail.com +universidad del salvador licenciatura en artes 2020-10-13 jennifer clark female 33 3267 cañada de las ovejas yjones@yahoo.com +universidad del salvador técnico para bioterios 2020-10-13 tiffany jensen female 27 6235 villa sauce wshelton@hotmail.com +universidad del salvador contador público 2020-10-13 tiffany martinez female 23 3400 bañado norte cross@hotmail.com +universidad del salvador ingeniería en informática 2020-10-13 steven clements male 39 4701 acostilla katherinevega@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-13 
ronald gould male 31 2743 arroyo dulce qmann@yahoo.com +universidad del salvador farmacia 2020-10-13 vincent hill male 35 3372 cataratas del iguazu hannahcollins@gmail.com +universidad del salvador diseño de imagen y sonido 2020-10-13 james moreno male 33 3362 1 de mayo sandrareynolds@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-13 kara white female 33 6471 atahualpa tpowers@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-13 danielle wood female 24 4122 alizal hkeller@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-13 stephanie peters female 37 8132 balneario chapalco stephenrivera@yahoo.com +universidad del salvador bioquímica 2020-10-14 luis allen male 21 3240 colonia egido ycohen@hotmail.com +universidad del salvador técnico para bioterios 2020-10-14 karen grant female 29 3134 antonio tomas sud isaiahcontreras@yahoo.com +universidad del salvador contador público 2020-10-14 jenny zimmerman female 35 5473 aguayo rwilson@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-14 chad rocha male 25 3712 los frentones john25@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-14 juan miller male 19 8417 cañadon chileno eric77@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-10-14 margaret moore female 25 3561 avellaneda browncatherine@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-14 connor strickland male 18 1893 centro agricola el pato baldwinalyssa@yahoo.com +universidad del salvador bioquímica 2020-10-14 gail walker female 35 2445 cristolia uchung@gmail.com +universidad del salvador diseño industrial 2020-10-14 cassandra steele female 24 7612 camet vanderson@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-14 matthew harrison male 29 1925 destileria fiscal kirbymichael@gmail.com +universidad del salvador 
licenciatura en ciencias biológicas 2020-10-14 brianna massey female 31 5474 barranquitas kelly33@hotmail.com +universidad del salvador diseño industrial 2020-10-14 david hall male 23 3200 colonia los sauces camachojessica@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-14 miguel hester male 17 3526 gandolfi anthonybarber@hotmail.com +universidad del salvador licenciatura en administración 2020-10-14 kimberly alexander female 29 8508 ambrosio p lezica jweeks@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-14 chelsey durham female 17 6034 colonia alberdi roblesthomas@gmail.com +universidad del salvador ingeniería mecánica 2020-10-14 janet martin female 19 2523 bouquet gsanders@hotmail.com +universidad del salvador ingeniería mecánica 2020-10-14 angela stokes female 23 5584 barrio villa adela baxtermichael@hotmail.com +universidad del salvador ingeniería en informática 2020-10-14 shelley cooper female 35 2938 alsina jmcguire@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-14 corey jimenez male 37 6279 batavia harrisonanthony@yahoo.com +universidad del salvador licenciatura en administración 2020-10-14 tracy cole male 19 3620 kilometro 184 caldwelljennifer@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-14 kaylee smith female 37 3164 colonia rivas simsemily@gmail.com +universidad del salvador licenciatura en artes 2020-10-15 pamela gonzalez female 17 5446 balde de leyes jennifer84@gmail.com +universidad del salvador bioquímica 2020-10-15 christine flores female 27 9409 isla gran malvina hollyellison@hotmail.com +universidad del salvador agronomía 2020-10-15 nancy gardner female 25 6725 carmen de areco jason02@yahoo.com +universidad del salvador licenciatura en administración 2020-10-15 melinda shelton female 25 7620 balcarce brownmegan@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-15 
jill smith female 27 1852 burzaco johnsimmons@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-15 michael brown male 29 2804 campana dennis56@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-15 michael anderson male 21 6509 del valle lambdonna@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-15 victoria cole female 39 5543 3 de mayo jamesjoshua@hotmail.com +universidad del salvador diseño industrial 2020-10-15 john parker male 37 7207 el trigo eweiss@yahoo.com +universidad del salvador arquitectura 2020-10-15 malik henry male 33 3144 alcaraz 1ro foxcarl@gmail.com +universidad del salvador ingeniería mecánica 2020-10-15 chad benson male 23 2252 colonia campo piaggio daniel70@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-15 nancy diaz female 27 6380 boeuf stanley99@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-16 nicholas wood male 27 9120 bahia cracher lucasdouglas@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-16 jessica floyd female 23 3244 colonia belga americana valenciajulie@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-16 joshua ray male 17 3045 campo zavalla matthewmarshall@hotmail.com +universidad del salvador farmacia 2020-10-16 catherine galvan female 19 4612 carahunco emilysmith@gmail.com +universidad del salvador técnico para bioterios 2020-10-16 diane larsen female 31 1650 general san martin fmontgomery@hotmail.com +universidad del salvador técnico para bioterios 2020-10-16 troy avery male 27 8175 goyena omcintyre@gmail.com +universidad del salvador actuario 2020-10-16 crystal campos female 26 3466 abalo websterdon@gmail.com +universidad del salvador farmacia 2020-10-16 shannon robertson female 25 3353 arroyo santa maria deannahernandez@hotmail.com +universidad del salvador actuario 2020-10-16 
kimberly huff female 33 2631 cora ineal@gmail.com +universidad del salvador farmacia 2020-10-16 chad white male 23 6312 ricardo lavalle sean80@yahoo.com +universidad del salvador licenciatura en artes 2020-10-16 richard jones male 26 2763 flamenco denise94@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-16 jonathan kim male 33 3261 centella dnielsen@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-16 anthony benton male 35 7220 funke aaron46@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-10-16 carol douglas female 23 1871 dock sud crodriguez@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-16 kayla dixon female 33 8353 aguada chacay co ryanwilliams@yahoo.com +universidad del salvador farmacia 2020-10-16 joseph gardner male 21 5741 13 de enero hmartin@yahoo.com +universidad del salvador licenciatura en artes 2020-10-17 george barrera male 25 6417 casbas fharris@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-17 jared rollins male 24 8315 achico houstonalexander@gmail.com +universidad del salvador actuario 2020-10-17 nicholas johnson male 21 3224 la blanqueada jonathan79@hotmail.com +universidad del salvador ingeniería mecánica 2020-10-17 regina thomas female 23 1653 villa ballester robin52@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-17 dalton roman male 25 8172 arroyo corto rebeccaross@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-17 christopher harper male 19 8185 campo del norte americano robertcallahan@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-17 james werner male 37 4111 aguada levinelaurie@hotmail.com +universidad del salvador licenciatura en artes 2020-10-17 bryan king male 25 1832 lomas de zamora charlesbailey@hotmail.com +universidad del salvador actuario 2020-10-17 lisa bell 
female 18 6553 la torrecita sara34@gmail.com +universidad del salvador medicina 2020-10-18 connie moore female 19 6030 edmundo perkins williamsbrian@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-18 edward gomez male 31 3114 aldea maria luisa brownsergio@yahoo.com +universidad del salvador arquitectura 2020-10-18 joseph davis male 27 9407 28 de noviembre michele61@gmail.com +universidad del salvador licenciatura en ciencia política 2020-10-18 jesse graham male 17 2801 alto verde davidcarolyn@yahoo.com +universidad del salvador diseño industrial 2020-10-18 brian gillespie male 26 8000 adela corti michaelhampton@gmail.com +universidad del salvador contador público 2020-10-18 catherine moreno female 25 3425 costa grande johnsonjeffrey@yahoo.com +universidad del salvador contador público 2020-10-18 victoria smith female 27 2103 colonia escribano farmercheryl@yahoo.com +universidad del salvador contador público 2020-10-18 destiny powers female 31 3700 barrio gral jose de san martin hicksdenise@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-10-18 debra cohen female 17 2123 campo calvo merritttamara@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-18 michelle cross female 17 3453 ifran tclarke@hotmail.com +universidad del salvador contador público 2020-10-18 paul cannon male 23 6665 ernestina codydecker@gmail.com +universidad del salvador bioquímica 2020-10-18 maureen nguyen female 27 7507 el bombero fwilliams@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-18 dawn freeman female 33 5636 favelli flawson@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-18 daniel holloway male 33 6511 hale robertmendez@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-19 tammy schmitt female 25 2806 las palmas roy73@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-19 
misty snow female 19 8501 bahia creek qerickson@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-19 eric howard male 27 1865 el pampero ifrazier@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-19 cameron mitchell male 25 2743 arroyo dulce sjones@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-19 james peterson male 33 2826 aldea san antonio cpeterson@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-19 derek smith male 39 2764 campo la nena wperkins@hotmail.com +universidad del salvador diseño industrial 2020-10-19 stephen ponce male 23 7521 deferrari mariawilson@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-19 raymond lewis male 25 8318 challaco michaelrobbins@yahoo.com +universidad del salvador técnico para bioterios 2020-10-19 amy lopez female 35 1653 villa ballester orivers@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-19 amy harper female 19 8203 la chirlandia jeffreylewis@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-19 meagan cooper female 31 7531 despeñaderos mgarcia@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-19 todd harrell male 29 1885 guillermo e hudson kellyproctor@yahoo.com +universidad del salvador diseño industrial 2020-10-19 amy oliver female 27 8319 campamento sol conradshawn@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-19 alexandra saunders female 26 3230 arbol solo theresasharp@gmail.com +universidad del salvador bioquímica 2020-10-19 adam sanders male 17 7407 libano taylorkeller@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-20 william kemp male 29 3204 ayui parada kennedyjoseph@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-20 elizabeth greer 
female 21 9310 aguada alegre ricemelissa@gmail.com +universidad del salvador ingeniería en informática 2020-10-20 charlene cunningham female 19 5881 cañada la negra henrylonnie@yahoo.com +universidad del salvador ingeniería en informática 2020-10-20 michelle meyer female 33 5449 aguango marisajohnson@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-20 michael carrillo male 29 8407 correntoso mthomas@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-20 james mendoza male 23 2136 san geronimo kimberly73@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-20 william adkins male 33 2943 ireneo portela matthew76@hotmail.com +universidad del salvador bioquímica 2020-10-20 william white male 27 4103 bajo de raco stephanie57@hotmail.com +universidad del salvador farmacia 2020-10-20 debbie christian female 19 5623 atuel sud psmall@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-20 reginald alvarado male 19 1712 castelar hudsonjessica@yahoo.com +universidad del salvador medicina 2020-10-20 albert mitchell male 39 7612 camet olivia25@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-20 elizabeth maddox female 25 3522 el retiro bwilliams@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-10-20 sherri yu female 35 9041 los antiguos robertarias@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-10-20 joe rogers male 17 1897 manuel b gonnet johnsonmichele@hotmail.com +universidad del salvador licenciatura en psicología 2020-10-21 jane mcbride female 24 3372 cataratas del iguazu natashagates@yahoo.com +universidad del salvador licenciatura en artes 2020-10-21 aaron moore male 22 3374 el porvenir nicole59@yahoo.com +universidad del salvador ingeniería en informática 2020-10-21 jessica flores female 25 5607 colonia bombal y tabanera jacksonlindsey@hotmail.com +universidad del 
salvador diseño de imagen y sonido 2020-10-21 alyssa morales female 19 3224 la blanqueada zcochran@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-10-21 roberta peterson female 25 7136 adela priceelizabeth@gmail.com +universidad del salvador licenciatura en psicología 2020-10-21 shawn sheppard male 35 5713 balde ahumada bryan94@yahoo.com +universidad del salvador medicina 2020-10-21 james jackson male 27 8101 calderon wnelson@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-21 brenda mcgrath female 27 2181 los molinos omoyer@yahoo.com +universidad del salvador técnico para bioterios 2020-10-21 dawn martin female 27 9111 bahia bustamante foxalexandra@hotmail.com +universidad del salvador diseño industrial 2020-10-21 bianca freeman female 31 7114 canal 15 cerro de la gloria saundersdavid@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-10-21 william richardson male 24 6309 alpachiri brownteresa@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-21 rodney moore male 27 3014 angel gallardo ericarobinson@hotmail.com +universidad del salvador ingeniería en informática 2020-10-21 bruce landry male 29 8532 arroyo salado odavis@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-21 maria rojas female 19 3541 campo las puertas suejones@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-21 george armstrong male 23 6031 de bruyn taramartinez@gmail.com +universidad del salvador contador público 2020-10-21 robert avery male 33 3300 arroyo lewismary@gmail.com +universidad del salvador licenciatura en artes 2020-10-21 daniel rodriguez male 23 6018 colonia los bosques floresjoseph@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-22 vanessa vaughn female 29 5707 aguaditas lwolfe@hotmail.com +universidad del salvador actuario 2020-10-22 jamie wilson female 23 4163 huasa pampa norte 
nelsonbrian@yahoo.com +universidad del salvador diseño industrial 2020-10-22 alicia newman female 29 1774 la salada kelleyaaron@gmail.com +universidad del salvador licenciatura en administración 2020-10-22 diane snyder female 29 5527 colonia santa teresa xhayden@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-22 michael edwards male 39 6634 alberti bmay@gmail.com +universidad del salvador ingeniería mecánica 2020-10-22 anthony patel male 37 4506 alegria kellymorales@gmail.com +universidad del salvador ingeniería mecánica 2020-10-22 jeffrey lewis male 31 3569 barros pazos christopher93@yahoo.com +universidad del salvador farmacia 2020-10-23 lisa ryan female 37 5446 balde de leyes sarah60@gmail.com +universidad del salvador técnico para bioterios 2020-10-23 jose herman male 27 4751 agua de dionisio richard73@hotmail.com +universidad del salvador licenciatura en sociología 2020-10-23 deborah tate female 23 7305 antonio de los heros morgan62@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-10-23 jessica lambert female 29 6403 badano meganweber@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-23 daniel meza male 23 4518 aguas calientes zallen@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-23 pamela robles female 37 4723 alijilan williambarry@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-10-23 brian howard male 20 3332 capiovi jacob99@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-23 susan rivera female 19 7521 deferrari timothy67@yahoo.com +universidad del salvador diseño industrial 2020-10-23 brett roy male 31 5447 agua cercada madisonkelly@hotmail.com +universidad del salvador agronomía 2020-10-23 shawn parks male 21 2752 almacen el descanso randall72@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-10-23 katrina mitchell female 19 6339 cailomuta 
dgibson@yahoo.com +universidad del salvador licenciatura en sociología 2020-10-23 john kaiser male 29 5700 alto blanco lisa40@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-23 eric fitzpatrick male 26 6103 amenabar harrisoncynthia@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-24 melissa glover female 21 7136 adela thomas45@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-24 ronald case male 19 1987 alegre grahamjames@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-24 judy martinez female 31 6311 campo de los toros patricia33@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-24 rose frazier female 27 6003 ascencion ijohnson@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-24 gregory morris male 19 6309 alpachiri millerjoshua@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-24 kevin atkinson male 25 2848 berisso cgonzales@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-24 misty barber female 21 5735 colonia bella vista anthonydennis@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-24 nathan scott male 23 3364 2 de mayo nrose@hotmail.com +universidad del salvador contador público 2020-10-24 shane kelly male 19 5636 favelli csanchez@yahoo.com +universidad del salvador diseño industrial 2020-10-24 carlos evans male 19 2409 estrada dodsonterri@yahoo.com +universidad del salvador farmacia 2020-10-24 steven berry male 39 1629 almirante irizar ferrelljason@hotmail.com +universidad del salvador licenciatura en artes 2020-10-24 mary torres female 39 1847 rafael calzada gruiz@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-24 danielle rodriguez female 29 5419 baños de la laja walkerdana@yahoo.com +universidad del salvador 
licenciatura en psicología 2020-10-24 mallory martinez female 27 7005 barker dana01@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-25 aaron rios male 37 2107 alvarez chavezamanda@gmail.com +universidad del salvador diseño industrial 2020-10-25 scott mays male 27 6207 alta italia meredithpena@yahoo.com +universidad del salvador licenciatura en sociología 2020-10-25 michele cain female 31 5571 chivilcoy grace89@gmail.com +universidad del salvador licenciatura en psicología 2020-10-25 ronald williams male 21 5519 alto de las arañas geraldsanchez@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-25 misty davis female 25 5624 kilometro 47 emilylee@hotmail.com +universidad del salvador farmacia 2020-10-25 robert boyd male 35 5531 barrio ferri sandrasanchez@hotmail.com +universidad del salvador contador público 2020-10-25 raymond hubbard male 27 3013 colonia matilde charlesramirez@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-25 david woods male 21 9409 isla gran malvina framirez@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-25 lisa orozco female 25 2119 arminda zhester@gmail.com +universidad del salvador diseño industrial 2020-10-25 megan ward female 37 7500 el carretero cbranch@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-25 stephanie hoover female 27 3133 arroyo burgos frank77@yahoo.com +universidad del salvador medicina 2020-10-25 jonathan chung male 19 6667 agustin mosconi denise87@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-25 kevin ali male 25 5386 amana phillip59@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-25 gary wright male 39 2317 casablanca sstewart@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-25 dawn warner female 31 3358 cheroguita 
curtischerry@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-25 david pope male 23 7543 la primavera chall@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-26 eileen ford female 17 5529 colonia bombal sandersandrea@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-26 karen brown female 17 3338 17 de agosto rmassey@gmail.com +universidad del salvador medicina 2020-10-26 cynthia davenport female 39 7021 alzaga davidmalone@yahoo.com +universidad del salvador diseño industrial 2020-10-26 eric jackson male 31 1876 bernal este karen56@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-10-27 sara holland female 23 7108 costa del este jeffreyfitzgerald@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-27 javier burgess male 19 3080 colonia pujol joshuarichardson@yahoo.com +universidad del salvador ingeniería mecánica 2020-10-27 chad fox male 23 4161 alongo jamesmiller@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-10-27 carl price male 35 8166 saldungaray andersonmichael@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-27 sarah edwards female 25 5385 aguadita johnrose@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-10-27 miranda riley female 27 7260 barrio villa saladillo lnash@gmail.com +universidad del salvador licenciatura en administración 2020-10-27 scott hicks male 39 2607 campo quirno crystal67@gmail.com +universidad del salvador técnico para bioterios 2020-10-27 brian lopez male 17 5563 agua amarga miguel54@gmail.com +universidad del salvador licenciatura en administración 2020-10-27 samantha stone female 33 2823 aero club canal bsimmons@yahoo.com +universidad del salvador licenciatura en artes 2020-10-27 jason sparks male 23 5717 el pimpollo tammy47@hotmail.com +universidad del salvador bioquímica 2020-10-27 phyllis 
gonzalez female 21 6474 campo aristimuño timothy26@gmail.com +universidad del salvador bioquímica 2020-10-27 christian garcia male 19 2919 copacabana elizabethsawyer@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-10-27 david bass male 25 6555 alfalad scottbennett@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-10-27 jack martin male 25 1768 ciudad madero michaeladams@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-28 joshua hudson male 31 1923 arroyo del pescado ericwilliams@gmail.com +universidad del salvador arquitectura 2020-10-28 tammy thompson female 37 7106 las toninas mkennedy@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-28 lance mayo male 23 5703 6 de septiembre uking@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-28 matthew hoffman male 37 7225 casalins cleonard@hotmail.com +universidad del salvador medicina 2020-10-28 michael hamilton male 29 1862 america unida robertslisa@gmail.com +universidad del salvador contador público 2020-10-28 alyssa martinez female 31 2903 erezcano julie21@yahoo.com +universidad del salvador agronomía 2020-10-28 ashley miller female 33 2747 coronel isleños wjimenez@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-28 kristen arias female 19 1640 acassuso nicholasshepherd@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-28 tamara kelley female 25 5598 bañado verde catherineroberson@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-28 gabrielle wood female 39 9409 isla gran malvina kmorris@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-28 andrea kirby female 24 3705 10 de mayo kristie75@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-28 emma williams female 23 2618 carmen 
rharvey@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-29 jessica walsh female 19 2529 piamonte susan41@gmail.com +universidad del salvador ingeniería mecánica 2020-10-29 derrick miller male 37 3451 batelito preed@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-10-29 vincent trujillo male 23 8101 calderon douglas08@yahoo.com +universidad del salvador licenciatura en administración 2020-10-29 kenneth park male 27 3113 colonia celina amanda28@gmail.com +universidad del salvador ingeniería en informática 2020-10-29 bridget garcia female 19 7003 aceilan jgomez@hotmail.com +universidad del salvador técnico para bioterios 2020-10-29 cynthia perez female 25 3044 gobernador crespo jared06@gmail.com +universidad del salvador licenciatura en administración 2020-10-29 michelle parks female 18 6389 alegria wsutton@yahoo.com +universidad del salvador licenciatura en psicología 2020-10-29 jodi lambert female 35 1661 bella vista fpaul@yahoo.com +universidad del salvador farmacia 2020-10-29 lisa snyder female 19 5275 agua colorada corey03@hotmail.com +universidad del salvador ingeniería electrónica 2020-10-29 karen gordon female 19 1816 colonia santa rosa robertthomas@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-29 andrew clark male 23 6553 la torrecita grahamjustin@yahoo.com +universidad del salvador medicina 2020-10-29 brian byrd male 17 2813 arroyo de la cruz nelsonsandra@hotmail.com +universidad del salvador bioquímica 2020-10-29 taylor chavez female 17 4147 alto las lechuzas hannahpeterson@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-29 dawn good female 21 1778 ciudad evita vincentkathy@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-29 robert brown male 26 4431 aguas calientes sheltonbobby@hotmail.com +universidad del salvador arquitectura 2020-10-29 kenneth robinson male 35 3164 colonia rivas 
ucochran@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-29 april king female 35 6441 colonia baron hirsch katherine33@gmail.com +universidad del salvador agronomía 2020-10-30 nathan martin male 26 3150 algarrobitos 1ro hansenbryan@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-30 angela bishop female 21 3344 2 de julio nicholas82@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-30 ashley wright female 37 2144 campo horquesco ebray@yahoo.com +universidad del salvador arquitectura 2020-10-30 charles mason male 21 1876 bernal este csnyder@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-10-30 eric johnson male 29 1655 jose leon suarez janet67@gmail.com +universidad del salvador contador público 2020-10-30 james navarro male 19 6530 carlos casares angela49@yahoo.com +universidad del salvador medicina 2020-10-30 karen obrien female 21 3361 acaragua tracypark@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-10-30 christopher gonzales male 31 7305 antonio de los heros jose32@yahoo.com +universidad del salvador ingeniería en informática 2020-10-30 connor golden male 39 3162 aranguren lhines@yahoo.com +universidad del salvador bioquímica 2020-10-30 bobby wang male 21 3007 empalme san carlos romandaniel@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-10-30 thomas sanchez male 23 6212 adolfo van praet todd46@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-10-30 cynthia nichols female 33 8407 correntoso cerickson@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-30 kevin ramirez male 39 6561 blanca grande agonzales@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-30 kathryn figueroa female 21 4144 amberes roy52@gmail.com +universidad del salvador diseño 
industrial 2020-10-30 stephen ross male 31 6051 ingeniero balbin sarahsullivan@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-10-30 michelle patterson female 31 5611 agua rica crosales@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-10-30 debra flores female 27 6628 colonia zambungo sandralarson@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-30 heather chapman female 20 3326 colonia leiva anthony73@yahoo.com +universidad del salvador ciencias veterinarias 2020-10-31 sara davis female 25 6434 palantelen barbaralopez@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-10-31 valerie jackson female 39 6431 estacion lago epecuen albert72@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-10-31 john rogers male 22 2820 colonia el potrero jessicaharris@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-31 robert hutchinson male 27 3536 bocas harold52@gmail.com +universidad del salvador licenciatura en administración 2020-10-31 lisa lewis female 18 3021 campo andino martinezdiane@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-10-31 april davis female 17 6559 recalde johnsonmelissa@hotmail.com +universidad del salvador licenciatura en administración 2020-10-31 kevin ellison male 26 5575 andrade ilewis@hotmail.com +universidad del salvador agronomía 2020-10-31 kathleen sharp female 33 5707 aguaditas gatesnancy@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-10-31 miguel wolf male 29 6712 cortines eblanchard@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-10-31 elizabeth lawrence female 27 5770 chacras viejas pclark@hotmail.com +universidad del salvador licenciatura en psicología 2020-10-31 jerry horton male 27 3443 colonia mendez bar troy11@gmail.com +universidad del salvador licenciatura en gestión de 
agroalimentos 2020-10-31 dean ward male 29 5645 el cenizo qramirez@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-10-31 robert henderson male 33 4142 alto de leiva brookerobbins@gmail.com +universidad del salvador licenciatura en sociología 2020-11-01 sarah jones female 19 6233 condarco watsonangela@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-01 william gomez male 21 2918 empalme villa constitucion amanda90@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-01 briana morgan female 27 7535 pontaut spencepeter@gmail.com +universidad del salvador bioquímica 2020-11-01 jeffrey bender male 26 2451 colonia la yerba christopher36@yahoo.com +universidad del salvador licenciatura en artes 2020-11-01 april hawkins female 29 8187 bordenave tuckerkristin@yahoo.com +universidad del salvador medicina 2020-11-01 victor gray male 35 7613 calfucura ellisjohnny@hotmail.com +universidad del salvador ingeniería electrónica 2020-11-01 james davis male 33 6330 arturo almaraz aaronjones@gmail.com +universidad del salvador medicina 2020-11-01 dakota wang male 35 6105 cañada seca christopherhogan@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-01 sean lambert male 24 2761 estancia santa catalina obrown@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-01 martin sherman male 33 8122 la viticola jhorn@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-01 megan anderson female 25 7200 el gualicho thompsonapril@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-01 david murray male 35 5573 colonia delfino lisacastro@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-01 tammy rodriguez female 31 3451 batelito westalexis@yahoo.com +universidad del salvador técnico para bioterios 2020-11-02 patricia brown female 17 3199 
los laureles eroberts@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-11-02 adam clark male 25 6201 chanilao ymills@gmail.com +universidad del salvador licenciatura en psicología 2020-11-02 gail palmer female 35 4709 san jose de piedra blanca glane@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-02 kathleen anderson female 31 4513 alto calilegua wilcoxcaitlin@yahoo.com +universidad del salvador medicina 2020-11-02 jackie taylor female 37 3172 kilometro 208 patricia76@hotmail.com +universidad del salvador diseño industrial 2020-11-02 mary grant female 31 3234 bonpland iowen@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-02 katherine anderson female 27 5442 ambas puntillas othompson@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-11-02 jeremy moore male 31 7201 colman wvaldez@hotmail.com +universidad del salvador licenciatura en sociología 2020-11-02 stacy salazar female 29 2456 esmeralda darius52@gmail.com +universidad del salvador actuario 2020-11-02 erica smith female 33 1737 kilometro 77 jocelyn41@gmail.com +universidad del salvador técnico para bioterios 2020-11-02 dylan davis male 37 5607 colonia bombal y tabanera ulynch@gmail.com +universidad del salvador ingeniería en informática 2020-11-02 melody foster female 33 9211 cushamen dodsonmichael@gmail.com +universidad del salvador ingeniería electrónica 2020-11-03 caleb garcia male 33 3574 capilla guadalupe norte justin49@gmail.com +universidad del salvador licenciatura en sociología 2020-11-03 brandon lopez male 39 2512 campo charo julie33@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-11-03 timothy webster male 27 5367 cachiyuyal nicole22@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-03 margaret smith female 37 9305 cañada de las vacas davieseddie@yahoo.com +universidad del salvador contador público 2020-11-03 shannon walsh 
female 18 3040 asuncion maria sbaker@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-03 brian morgan male 18 3216 arroyo hondo danielwest@hotmail.com +universidad del salvador licenciatura en artes 2020-11-03 karen grant female 18 1802 aeropuerto ezeiza vevans@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-03 jessica munoz female 19 4168 agua blanca victoria81@gmail.com +universidad del salvador licenciatura en psicología 2020-11-03 chad howell male 19 3407 aguay iparsons@yahoo.com +universidad del salvador licenciatura en administración 2020-11-03 sarah phillips female 35 7130 caminera samborombon patricia70@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-03 christopher hartman male 27 3052 cañadita shane64@yahoo.com +universidad del salvador licenciatura en psicología 2020-11-03 lisa henson female 23 7167 carilo cynthiahoward@yahoo.com +universidad del salvador ingeniería mecánica 2020-11-03 patrick wright male 23 6063 porvenir paula78@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-03 edward aguirre male 27 6235 villa sauce ann60@yahoo.com +universidad del salvador ingeniería electrónica 2020-11-03 meghan wallace female 24 3309 arroyo tomas scotttran@gmail.com +universidad del salvador medicina 2020-11-04 robin cardenas female 25 8307 colonia gobernador ayala omcdaniel@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-04 sara garcia female 19 7300 azul fullerroberta@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-04 erika carter female 37 3701 almirante brown gloria98@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-04 melissa hill female 27 7540 bathurst estacion akelly@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-11-04 robert booker male 23 7635 el lenguaraz 
james26@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-04 nicholas smith male 24 6216 bagual ufoster@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-04 timothy williams male 24 6031 de bruyn chall@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-04 justin hampton male 25 4728 chumbicha nicole88@hotmail.com +universidad del salvador ingeniería en informática 2020-11-05 melanie franco female 25 6279 batavia marshallamber@gmail.com +universidad del salvador medicina 2020-11-05 katherine haynes female 20 6661 blas durañona diazbrett@yahoo.com +universidad del salvador medicina 2020-11-05 ryan hill male 19 5350 el molle danielandrea@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-05 nathan morris male 33 3592 colonia hardy elizabeth81@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-11-05 jeffrey hahn male 24 2846 anahi patelmichael@gmail.com +universidad del salvador licenciatura en artes 2020-11-05 luis guerrero male 19 5585 el cipres andrew54@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-05 scott thomas male 25 9121 aguada de las tejas awest@yahoo.com +universidad del salvador ciencias veterinarias 2020-11-05 jamie baxter female 35 5585 el cipres mark37@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-05 bradley roberts male 35 2942 baradero gmiller@gmail.com +universidad del salvador contador público 2020-11-05 suzanne ramsey female 35 3327 colonia roca dmoreno@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-05 jonathan hart male 39 3474 chavarria malik35@gmail.com +universidad del salvador bioquímica 2020-11-05 colleen olson female 39 8430 costa del rio azul donna21@hotmail.com +universidad del salvador licenciatura en psicología 2020-11-05 jennifer sanchez female 29 5325 alpasinche fostergary@gmail.com 
+universidad del salvador diseño industrial 2020-11-05 lauren reese female 33 6071 bermudez christopher30@yahoo.com +universidad del salvador farmacia 2020-11-06 kimberly blevins female 25 8508 ambrosio p lezica charles51@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-06 melissa reed female 21 5710 la punta lawrence13@hotmail.com +universidad del salvador contador público 2020-11-06 daniel reed male 33 4182 campo la flor los ralos millerlori@hotmail.com +universidad del salvador agronomía 2020-11-06 vanessa chavez female 31 1987 alegre uhaley@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-06 anna fuentes female 31 9311 cañadon leon xparker@gmail.com +universidad del salvador farmacia 2020-11-06 kathy williams female 31 4750 agua colorada brooke36@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-11-06 brittany howard female 37 7535 pontaut gregory44@yahoo.com +universidad del salvador ingeniería en informática 2020-11-06 jennifer schwartz female 37 1907 el pino hcamacho@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-06 jessica schneider female 31 6451 ancon robert40@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-06 leonard avila male 19 3423 arañita ramirezchristina@hotmail.com +universidad del salvador ingeniería electrónica 2020-11-06 robert brown male 33 3309 arroyo tomas robinperkins@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-06 malik shepherd male 27 6315 colonia baron carol37@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-06 jacob davis male 19 5272 comandante leal mariaferguson@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-06 sarah hamilton female 19 7220 funke kayla99@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-06 sandra 
cooper female 19 3557 caraguatay thall@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-06 jeremy smith male 27 3197 abra guazu katherine12@hotmail.com +universidad del salvador ingeniería en informática 2020-11-06 jonathan reynolds male 19 6050 cuartel vii larrydavis@hotmail.com +universidad del salvador bioquímica 2020-11-07 ricardo morris male 35 6439 bonifacio qdudley@hotmail.com +universidad del salvador actuario 2020-11-07 kimberly kane female 29 5380 chamical rachelbrown@hotmail.com +universidad del salvador licenciatura en administración 2020-11-07 stephen bradley male 24 1870 avellaneda monroeandrew@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-07 christina parker female 25 4504 23 de agosto michaelwilliams@gmail.com +universidad del salvador licenciatura en artes 2020-11-07 lori bishop female 19 3046 arrascaeta mirandajones@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-07 carrie day female 39 5633 ochenta y cuatro otate@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-07 emily cooke female 33 8168 sierra de la ventana megan15@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-07 herbert sullivan male 31 7631 costa bonita balneario billydixon@hotmail.com +universidad del salvador bioquímica 2020-11-07 louis smith male 31 3425 costa grande jordanrogers@gmail.com +universidad del salvador arquitectura 2020-11-07 anthony thomas male 21 3701 almirante brown sharonfarley@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-07 rhonda thompson female 22 1627 matheu dterrell@gmail.com +universidad del salvador ingeniería mecánica 2020-11-07 brandon obrien male 20 3187 atencio crystal85@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-08 brandi fuentes female 21 6237 america qmoyer@hotmail.com +universidad del salvador agronomía 
2020-11-08 ronald braun male 37 9031 bajo la cancha paigegoodwin@hotmail.com +universidad del salvador licenciatura en artes 2020-11-08 david stark male 19 3208 colonia ensanche sauce alexanderbullock@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-08 clifford mills male 37 5636 favelli heather68@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-08 jared simpson male 25 3302 aguara cua dereknelson@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-08 timothy rivera male 25 6439 bonifacio cody30@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-08 leslie schneider female 25 2611 estacion christophersen gregorycarlson@hotmail.com +universidad del salvador técnico para bioterios 2020-11-08 lisa martinez female 24 4124 abra el candado rose80@hotmail.com +universidad del salvador actuario 2020-11-08 alyssa hernandez female 19 3427 abra hughesjessica@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-11-08 ashley mcconnell female 23 1657 11 de septiembre ruthcarter@yahoo.com +universidad del salvador licenciatura en administración 2020-11-08 corey wood male 27 3302 aguara cua audreybest@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-08 heather holmes female 27 5505 carbometal jennifer37@hotmail.com +universidad del salvador ciencias veterinarias 2020-11-08 sarah cruz female 29 7406 aldecon rhondacarlson@hotmail.com +universidad del salvador farmacia 2020-11-08 paula johns female 20 4633 san pedro de iruya zcaldwell@yahoo.com +universidad del salvador ciencias veterinarias 2020-11-09 angela lewis female 31 2505 campo la riviere lhicks@hotmail.com +universidad del salvador bioquímica 2020-11-09 samuel davidson male 19 1625 arroyo canelon shawnwhite@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-09 jason mcdonald male 39 7160 la union 
codygilmore@hotmail.com +universidad del salvador ingeniería mecánica 2020-11-09 tracy cortez female 23 3534 colonia el aguara kbarnes@yahoo.com +universidad del salvador ciencias veterinarias 2020-11-09 karina hogan female 33 2854 dos hermanas jason43@yahoo.com +universidad del salvador arquitectura 2020-11-09 amber rodriguez female 25 5384 punta de los llanos yangmarc@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-09 katherine johnson female 17 7641 balneario los angeles psoto@yahoo.com +universidad del salvador licenciatura en sociología 2020-11-09 melanie cox female 25 4600 algarrobal cassandrameyers@hotmail.com +universidad del salvador licenciatura en sociología 2020-11-09 lauren shepard female 26 6706 est jauregui va flandria bpeterson@hotmail.com +universidad del salvador ciencias veterinarias 2020-11-09 joanna sanchez female 37 5427 apeadero quiroga kmontgomery@hotmail.com +universidad del salvador técnico para bioterios 2020-11-09 richard nguyen male 27 8328 allen johnsonchristine@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-09 emily schmidt female 19 6538 la dorita jennifer20@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-11-09 nicole carter female 33 6106 aaron castellanos jasongreen@yahoo.com +universidad del salvador ingeniería en informática 2020-11-10 sherri fry female 23 8103 garro wlawson@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-10 sandra norman female 33 1706 haedo kcohen@hotmail.com +universidad del salvador licenciatura en administración 2020-11-10 sean mendoza male 25 2512 campo charo larry27@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-10 aaron price male 17 1911 bme bavio gral mansilla brandtrenee@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-10 joann turner female 25 1771 mercado central scottgentry@hotmail.com 
+universidad del salvador ingeniería en informática 2020-11-10 matthew holt male 19 5372 nonogasta barbara91@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-10 sarah zamora female 27 7407 libano hmercer@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-10 william carroll male 27 9103 bajo de los huesos nelsonbrian@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-11-10 kimberly edwards female 23 2454 cañada rosquin craigcampos@gmail.com +universidad del salvador diseño industrial 2020-11-10 denise miller female 35 1643 beccar marcrussell@hotmail.com +universidad del salvador licenciatura en artes 2020-11-10 matthew armstrong male 17 7000 cantera aguirre ocohen@hotmail.com +universidad del salvador medicina 2020-11-10 christopher reed male 37 8168 sierra de la ventana bkerr@gmail.com +universidad del salvador licenciatura en sociología 2020-11-10 vincent santos male 39 6407 girodias bphillips@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-10 jillian burke female 31 5589 chapanay lisaarmstrong@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-10 david smith male 23 5743 la isabel autumnpayne@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-10 christina davis female 24 3355 arrechea ygarrett@hotmail.com +universidad del salvador medicina 2020-11-11 haley fuller female 35 1611 don torcuato stonealexander@hotmail.com +universidad del salvador medicina 2020-11-11 christopher kirk male 26 8126 aldea san andres weeksrobert@hotmail.com +universidad del salvador licenciatura en artes 2020-11-11 robert wright male 29 3460 arroyo castillo richard83@yahoo.com +universidad del salvador contador público 2020-11-11 drew davis male 31 3116 aldea chaleco kathleen94@yahoo.com +universidad del salvador arquitectura 2020-11-11 summer irwin female 24 7313 16 de julio leesusan@hotmail.com 
+universidad del salvador licenciatura en administración 2020-11-11 jessica rodriguez female 29 7108 costa del este mnelson@hotmail.com +universidad del salvador diseño industrial 2020-11-11 robert patel male 27 3551 campo monte la viruela michael81@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-11 mikayla stevens female 19 3372 cataratas del iguazu frank35@hotmail.com +universidad del salvador licenciatura en sociología 2020-11-11 ryan george male 19 9011 bahia langara joseph71@hotmail.com +universidad del salvador arquitectura 2020-11-11 kristin ellis female 39 1647 zona delta san fernando trios@yahoo.com +universidad del salvador licenciatura en sociología 2020-11-11 sara carr female 17 3162 aranguren chrissmith@yahoo.com +universidad del salvador actuario 2020-11-11 sarah byrd female 21 6433 arturo vatteone xavierdelacruz@hotmail.com +universidad del salvador diseño industrial 2020-11-11 michael tran male 19 4000 estacion de zootecnia b frank85@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-11 lori contreras female 27 9210 cuesta del ternero etaylor@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-12 michael maddox male 29 7150 ayacucho christopher67@gmail.com +universidad del salvador licenciatura en psicología 2020-11-12 elizabeth liu female 23 2751 almacen castro prestonscott@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-12 anthony lopez male 25 1931 punta lara monroebrenda@yahoo.com +universidad del salvador ingeniería electrónica 2020-11-12 chad gonzales male 27 7267 alvarez de toledo robert24@hotmail.com +universidad del salvador bioquímica 2020-11-12 amy molina female 37 1731 villars christine26@yahoo.com +universidad del salvador licenciatura en psicología 2020-11-12 julia brooks female 25 1770 aldo bonzi oliviastewart@gmail.com +universidad del salvador licenciatura en ciencias de la educación 
2020-11-12 joshua carter male 27 4718 barro negro gvillanueva@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-12 matthew davis male 25 3705 10 de mayo wrightkathleen@hotmail.com +universidad del salvador ingeniería mecánica 2020-11-12 jorge perez male 17 6244 banderalo jasminerussell@gmail.com +universidad del salvador licenciatura en artes 2020-11-12 sean neal male 37 5446 balde de leyes phamjonathon@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-12 adam mahoney male 35 4751 agua de dionisio twalsh@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-12 heather clark female 27 4107 aconquija gpayne@yahoo.com +universidad del salvador contador público 2020-11-12 richard duarte male 23 2454 cañada rosquin tpollard@yahoo.com +universidad del salvador agronomía 2020-11-12 melissa hernandez female 37 5770 chacras viejas lewisrandy@gmail.com +universidad del salvador bioquímica 2020-11-12 nicole chaney female 24 3107 colonia avellaneda evaughn@hotmail.com +universidad del salvador licenciatura en psicología 2020-11-12 pam torres female 27 7408 la colina davidwall@hotmail.com +universidad del salvador licenciatura en artes 2020-11-12 vanessa leon female 25 8501 bahia creek cbenton@gmail.com +universidad del salvador ingeniería electrónica 2020-11-12 joseph thomas male 39 6032 blandengues ericwaters@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-11-13 pamela davis female 39 4434 anta allenmichael@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-13 michele rivera female 25 9305 cañada de las vacas helen20@hotmail.com +universidad del salvador arquitectura 2020-11-13 jennifer wilson female 21 5724 alto pencoso smithmichelle@yahoo.com +universidad del salvador licenciatura en sociología 2020-11-13 kelly davis female 23 5340 agua grande joseph37@hotmail.com +universidad del salvador licenciatura en psicología 
2020-11-13 matthew terrell male 33 1648 rincon de milberg zimmermanamanda@gmail.com +universidad del salvador bioquímica 2020-11-13 eric simon male 23 7400 barrio la luisa michaeladams@hotmail.com +universidad del salvador bioquímica 2020-11-13 jason howard male 23 6727 gouin bhull@hotmail.com +universidad del salvador bioquímica 2020-11-13 denise floyd female 27 6621 anderson eric14@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-13 kendra hill female 22 6612 capdepont calebsims@hotmail.com +universidad del salvador actuario 2020-11-13 emily leonard female 29 1613 los polvorines evansrobin@gmail.com +universidad del salvador licenciatura en psicología 2020-11-13 mary porter female 33 1919 base aeronaval punta indio rasmussenmark@hotmail.com +universidad del salvador licenciatura en sociología 2020-11-13 michael webster male 25 3228 cabi monda davilajeffrey@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-13 ana webb female 39 3414 abra williamseric@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-13 joseph clark male 25 2918 empalme villa constitucion lwilliams@gmail.com +universidad del salvador ciencias veterinarias 2020-11-14 timothy dickerson male 31 2255 campo rodriguez christophermyers@hotmail.com +universidad del salvador medicina 2020-11-14 john lee male 23 7515 claudio c molina john66@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-14 dylan williams male 23 1876 bernal este sandersrandy@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-14 kimberly collins female 21 4751 agua de dionisio rthomas@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-14 gregory stafford male 31 3164 colonia rivas john40@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-14 emily reynolds female 33 3500 colonia florencia ugibson@hotmail.com +universidad del 
salvador licenciatura en musicoterapia 2020-11-14 krystal gibson female 27 3269 arroyo baru fdiaz@hotmail.com +universidad del salvador diseño industrial 2020-11-14 nicole sanders female 29 1647 zona delta san fernando yclark@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-14 sandra snyder female 25 9015 alma grande floresmeghan@yahoo.com +universidad del salvador técnico para bioterios 2020-11-14 crystal johnson female 17 7543 la primavera hrose@gmail.com +universidad del salvador diseño de imagen y sonido 2020-11-14 jonathan conner male 33 2409 estrada loganporter@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-14 shelby blackwell female 31 8214 colonia cazaux christina23@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-14 christine munoz female 35 6300 barrancas coloradas jacob22@hotmail.com +universidad del salvador farmacia 2020-11-14 zachary miller male 22 7613 calfucura lisanixon@gmail.com +universidad del salvador ingeniería mecánica 2020-11-14 tyler wilson male 31 3481 angostura glenncruz@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-14 luis mcdaniel male 23 3085 pilar townsendana@gmail.com +universidad del salvador ingeniería mecánica 2020-11-15 sara ayala female 21 6417 casbas landerson@hotmail.com +universidad del salvador contador público 2020-11-15 erika barr female 29 7135 comandante giribone justinwalter@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-15 jordan hansen female 23 3085 pilar carolynduke@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-15 kimberly owens female 27 3526 gandolfi iwoodward@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-15 kelly cobb female 33 4168 agua blanca dawsondarren@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-15 brian 
schmidt male 29 2103 colonia escribano lcastro@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-15 nicole atkins female 19 3465 arroyo casco bradadams@gmail.com +universidad del salvador licenciatura en administración 2020-11-15 brian moore male 23 7111 san bernardo del tuyu robertdickson@gmail.com +universidad del salvador contador público 2020-11-15 jennifer rodriguez female 21 1882 ezpeleta este lewiserik@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-16 christopher barnett male 27 8126 aldea san andres keith11@gmail.com +universidad del salvador licenciatura en administración 2020-11-16 matthew hodge male 35 2721 el arbolito rodriguezjennifer@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-16 tammy clark female 25 5331 andalucia brendahunt@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-16 wanda jones female 31 2134 roldan thomasporter@yahoo.com +universidad del salvador licenciatura en psicología 2020-11-16 nicole hale female 19 6341 chapi talo kathy93@hotmail.com +universidad del salvador arquitectura 2020-11-16 erica wheeler female 21 1804 canning jasonsanchez@hotmail.com +universidad del salvador ingeniería electrónica 2020-11-16 anthony blair male 23 9001 cañadon ferrais jeanettejohnson@gmail.com +universidad del salvador licenciatura en psicología 2020-11-16 michael webb male 26 6645 la limpia brittney20@yahoo.com +universidad del salvador contador público 2020-11-16 brendan stark male 17 2529 piamonte hopkinsgerald@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-16 michele wiley female 27 3080 colonia pujol zmontoya@hotmail.com +universidad del salvador contador público 2020-11-16 john carroll male 23 5738 avanzada thorntonrobert@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-16 bryan murray male 35 2508 armstrong jessica40@gmail.com 
+universidad del salvador licenciatura en administración 2020-11-16 jamie miller female 35 7530 coronel pringles xhall@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-17 jamie harvey female 23 5403 barrialitos lauren93@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-17 brittney hamilton female 39 6064 eduardo costa erica82@gmail.com +universidad del salvador licenciatura en sociología 2020-11-17 monica campbell female 37 2253 campo gimenez imorris@gmail.com +universidad del salvador medicina 2020-11-17 carrie morris female 25 2617 sancti spiritu samuelmiller@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-17 brianna blackwell female 33 2187 arteaga jamesbennett@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-17 jason farley male 21 6516 amalia uhayes@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-17 james phillips male 19 2115 colonia valdez wbryan@yahoo.com +universidad del salvador ingeniería mecánica 2020-11-17 laura mcgee female 25 8311 villa el chocon wilkinsjoshua@yahoo.com +universidad del salvador medicina 2020-11-17 leslie brown female 21 2403 bauer y sigel floresheidi@yahoo.com +universidad del salvador licenciatura en artes 2020-11-17 breanna levy female 24 3575 arroyo ceibal jasoncampbell@gmail.com +universidad del salvador actuario 2020-11-17 michelle porter female 33 8154 calvo fosterbenjamin@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-11-17 benjamin vasquez male 17 8129 17 de agosto annettekoch@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-17 linda leonard female 31 5311 arauco martinfrancisco@hotmail.com +universidad del salvador medicina 2020-11-17 mariah martinez female 21 5572 alto grande kingchristy@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-17 jeffrey 
quinn male 17 6424 beruti emartinez@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-18 april rose female 21 8168 sierra de la ventana vanessa38@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-18 stephen scott male 37 5438 alto de sierra alison13@gmail.com +universidad del salvador diseño de imagen y sonido 2020-11-18 ryan rojas male 35 3555 campo huber kellymcmillan@yahoo.com +universidad del salvador licenciatura en artes 2020-11-18 susan smith female 23 1895 arturo segui sarajohnson@hotmail.com +universidad del salvador contador público 2020-11-18 fernando boyd male 37 7531 despeñaderos sotokevin@hotmail.com +universidad del salvador medicina 2020-11-18 danny cannon male 37 8303 cinco saltos kimberlywyatt@yahoo.com +universidad del salvador licenciatura en psicología 2020-11-18 brianna lucas female 29 1676 santos lugares miacastillo@gmail.com +universidad del salvador farmacia 2020-11-18 mike patton male 29 3214 estacion yerua jarvisjennifer@gmail.com +universidad del salvador arquitectura 2020-11-18 linda rios female 27 8418 anecon chico kellyprice@hotmail.com +universidad del salvador agronomía 2020-11-18 juan mann male 25 5544 gobernador benegas aguirrejennifer@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-18 amanda smith female 37 3222 buen retiro williamsallison@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-18 evelyn gonzalez female 23 2409 estrada christopher21@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-19 manuel thompson male 27 2617 sancti spiritu dhawkins@gmail.com +universidad del salvador técnico para bioterios 2020-11-19 frank villa male 27 1650 general san martin qhamilton@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-11-19 heather parker female 35 4133 la banda warnererin@hotmail.com +universidad del salvador ingeniería 
electrónica 2020-11-19 elizabeth sparks female 33 6748 membrillar clin@hotmail.com +universidad del salvador licenciatura en sociología 2020-11-19 daniel lopez male 25 6661 blas durañona obriendavid@gmail.com +universidad del salvador ciencias veterinarias 2020-11-19 jordan gonzalez female 39 5773 cañada kjackson@gmail.com +universidad del salvador arquitectura 2020-11-20 david randolph male 23 6616 castilla leahedwards@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-20 antonio lee male 31 6441 colonia baron hirsch sgutierrez@hotmail.com +universidad del salvador ingeniería mecánica 2020-11-20 audrey flowers female 37 5577 el alto steven90@yahoo.com +universidad del salvador agronomía 2020-11-20 susan simmons female 29 2214 aldao sarah17@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-20 austin green male 25 1716 libertad rhardin@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-20 chad kelley male 31 3016 san jose gharris@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-20 amanda lawson female 17 6503 desvio kilometro 234 samanthaowen@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-20 derrick moore male 33 5577 el alto omar43@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-20 cindy torres female 21 5266 chichagasta bensonjames@gmail.com +universidad del salvador licenciatura en ciencia política 2020-11-20 leah andrews female 24 3105 diamante lovenatasha@gmail.com +universidad del salvador agronomía 2020-11-20 regina bauer female 23 3050 calchaqui hwells@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-20 jody williams female 20 3454 bañado san antonio fowlerwilliam@hotmail.com +universidad del salvador diseño industrial 2020-11-21 steven reeves male 31 3357 barra bonita knappjennifer@gmail.com +universidad del salvador 
licenciatura en ciencias ambientales 2020-11-21 shannon becker female 29 6533 alfredo demarchi uthomas@yahoo.com +universidad del salvador agronomía 2020-11-21 richard miller male 37 3448 alamo justin89@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-21 raymond andrews male 23 6101 villa saboya paulhamilton@gmail.com +universidad del salvador licenciatura en administración 2020-11-21 carol blake female 25 5591 alpatacal danielburch@gmail.com +universidad del salvador bioquímica 2020-11-21 anthony baird male 25 1665 jose clemente paz hernandezandrew@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-11-21 bradley anderson male 23 5636 favelli cochranbrittany@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-22 marc burton male 17 7226 gorchs jordanrobert@yahoo.com +universidad del salvador diseño industrial 2020-11-22 courtney ramirez female 17 9301 el chalten sarah63@yahoo.com +universidad del salvador arquitectura 2020-11-22 james porter male 21 1907 el pino hward@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-22 stacey russell female 29 8430 costa del rio azul jennifer99@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-22 kenneth smith male 27 8113 baterias daniellelee@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-22 larry herrera male 39 3575 arroyo ceibal danielsjean@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-22 amy rhodes female 39 6665 ernestina traceysharp@hotmail.com +universidad del salvador arquitectura 2020-11-22 daniel short male 39 6205 el guanaco cindyhall@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-22 kaitlin wade female 17 7212 doctor domingo harosteguy luiscarter@yahoo.com +universidad del salvador arquitectura 2020-11-22 lauren gonzalez female 33 6505 dudignac 
williamssamuel@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-22 ana phillips female 37 2747 coronel isleños linda96@hotmail.com +universidad del salvador farmacia 2020-11-22 scott mccarthy male 23 6531 algarrobo jon76@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-22 marcus murphy male 27 7201 colman tylerallison@yahoo.com +universidad del salvador ciencias veterinarias 2020-11-22 molly curtis female 37 3423 arañita anna26@yahoo.com +universidad del salvador agronomía 2020-11-22 amber graham female 19 6361 agustoni kristinacompton@yahoo.com +universidad del salvador farmacia 2020-11-22 tracy gibbs female 37 1888 florencio varela thomastammy@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-22 laurie brown female 25 1642 san isidro michael35@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-22 tina berg female 23 1649 zona delta tigre bowersnatalie@yahoo.com +universidad del salvador agronomía 2020-11-23 mary bailey female 37 1862 america unida reginachurch@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-23 mary townsend female 26 8364 chimpay thoffman@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-23 lisa rogers female 27 7169 juancho wrightmichael@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-23 brian cruz male 35 5565 campo de los andes sjohnson@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-23 laura smith female 25 3503 barranqueras robert73@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-23 patricia martin female 37 6003 ascencion thodges@gmail.com +universidad del salvador técnico para bioterios 2020-11-23 joshua bell male 17 6325 colonia devoto andrestate@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-24 
leslie macdonald female 19 1893 centro agricola el pato lewiskristen@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-24 bradley hernandez male 37 7313 16 de julio sandrawebster@hotmail.com +universidad del salvador arquitectura 2020-11-24 mark johnson male 24 4724 agua colorada browntravis@hotmail.com +universidad del salvador licenciatura en administración 2020-11-24 joanna key female 17 7106 las toninas elizabeth94@gmail.com +universidad del salvador ingeniería mecánica 2020-11-24 patricia munoz female 29 2643 cafferata amiller@yahoo.com +universidad del salvador bioquímica 2020-11-24 laurie schmitt female 17 2617 sancti spiritu traviswalker@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-11-24 dustin wright male 27 2345 campo botto zmoreno@hotmail.com +universidad del salvador ingeniería mecánica 2020-11-24 jennifer olsen female 19 2156 arsenal de guerra san lorenzo sheltoncrystal@yahoo.com +universidad del salvador actuario 2020-11-24 barbara perez female 17 4503 arrayanal clarkmichael@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-24 jacob sparks male 24 3240 colonia egido cassie03@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-25 john english male 35 3405 algarrobal puisoye eringarcia@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-11-25 brian clark male 35 2138 carcaraña fernando28@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-25 jessica stewart female 33 4624 abra mayo brenda74@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-25 alyssa george female 26 3536 bocas stacey81@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-25 kelly henry female 19 3083 grutly millerjared@yahoo.com +universidad del salvador licenciatura en psicología 2020-11-25 david mccoy 
male 27 5436 colonia zapata allenronnie@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-25 timothy aguirre male 23 3486 villa olivari dyoung@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-11-25 kirk robinson male 31 5724 alto pencoso xthompson@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-25 kyle gross male 17 7174 arroyo grande randylong@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-25 mary lee female 35 8316 balsa senillosa adamhill@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-25 nicole hopkins female 20 5260 acheral christopher41@gmail.com +universidad del salvador técnico para bioterios 2020-11-25 rachel johnson female 25 2300 colonia bella italia uwilson@hotmail.com +universidad del salvador ingeniería en informática 2020-11-25 dale long male 19 1761 20 de junio matthew93@gmail.com +universidad del salvador diseño industrial 2020-11-25 michelle holmes female 39 6422 primera junta gonzalezvanessa@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-25 kristine sullivan female 23 1884 berazategui flowersjames@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-25 matthew gutierrez male 31 3308 candelaria tiffanydavis@yahoo.com +universidad del salvador licenciatura en psicología 2020-11-25 carlos smith male 26 4723 alijilan matthew57@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-26 john jenkins male 25 6660 25 de mayo reynoldskenneth@gmail.com +universidad del salvador ingeniería en informática 2020-11-26 pamela mayo female 23 4740 agua salada juliejones@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-11-26 timothy wilson male 25 5419 baños de la laja anthony97@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-26 jordan 
griffin male 26 6070 balsa kristinbaldwin@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-26 lindsay obrien female 27 4119 agua colorada ifarrell@gmail.com +universidad del salvador licenciatura en psicología 2020-11-26 christie thomas female 25 2501 berretta dbrooks@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-11-26 richard stevens male 33 5436 colonia zapata terry03@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-11-26 tiffany jones female 31 1905 jose ferrari nolson@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-27 timothy anderson male 33 5609 aristides villanueva kingwendy@hotmail.com +universidad del salvador licenciatura en sociología 2020-11-27 sharon randolph female 39 2741 el retiro mckinneykimberly@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-27 jessica ford female 27 5709 bañadito viejo jamespalmer@gmail.com +universidad del salvador ingeniería electrónica 2020-11-27 zachary fisher male 35 7136 adela kprice@yahoo.com +universidad del salvador técnico para bioterios 2020-11-27 sue hughes female 21 4139 agua amarilla la hoyada sandrajimenez@gmail.com +universidad del salvador licenciatura en artes 2020-11-27 theresa johnson female 25 5545 agua de diaz harveykelsey@gmail.com +universidad del salvador agronomía 2020-11-27 craig young male 23 3306 centinela daniel34@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-27 robert mcclure male 37 8347 arroyo cahunco matthewbeck@hotmail.com +universidad del salvador ingeniería en informática 2020-11-27 debbie craig female 24 2609 colonia morgan dharvey@gmail.com +universidad del salvador licenciatura en psicología 2020-11-27 courtney jones female 23 6433 arturo vatteone michelleford@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-27 mary rodriguez female 35 3732 colonia 
abate kelly27@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-11-27 sandy reyes female 17 2119 arminda emilyboyle@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-28 amanda cox female 27 2761 estancia santa catalina vcampbell@gmail.com +universidad del salvador técnico para bioterios 2020-11-28 amber lopez female 17 6743 coliqueo campbellallen@hotmail.com +universidad del salvador ingeniería mecánica 2020-11-28 tara tran female 37 5474 barranquitas patelmackenzie@yahoo.com +universidad del salvador ingeniería electrónica 2020-11-28 edward wheeler male 33 7223 bonnement burnettbrian@yahoo.com +universidad del salvador farmacia 2020-11-28 howard cohen male 17 5500 cerro aconcagua michaelnichols@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-28 colleen smith female 25 7107 santa teresita nharvey@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-28 david flores male 19 3177 altamirano norte flowerskaitlyn@gmail.com +universidad del salvador ingeniería mecánica 2020-11-28 gary davies male 33 5521 los corredores pbrady@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-28 renee williams female 24 2136 san geronimo victoria69@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-11-28 elizabeth taylor female 31 6601 altamira mcculloughmary@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-11-28 heather fisher female 25 9035 arroyo chalia erin73@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-28 timothy medina male 35 3125 antonio tomas erin20@yahoo.com +universidad del salvador técnico para bioterios 2020-11-28 susan young female 17 2258 campo quiñones amy45@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-11-28 michele alvarez female 21 5383 agua colorada 
christine92@yahoo.com +universidad del salvador medicina 2020-11-29 gregory benitez male 21 6031 de bruyn collinsjennifer@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-29 theresa hudson female 39 5612 valle de las leñas bonillamichael@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-29 yvonne mcintosh female 23 6279 batavia kimberlyscott@hotmail.com +universidad del salvador licenciatura en administración 2020-11-29 joshua harris male 35 3513 arbol solo oliviarivera@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-11-29 sarah aguirre female 20 7503 cristiano muerto paul08@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-29 katherine rodriguez female 29 1895 arturo segui deborah45@yahoo.com +universidad del salvador arquitectura 2020-11-29 david baker male 31 6634 alberti christiansmith@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-11-29 amber mann female 29 1636 la lucila susan22@hotmail.com +universidad del salvador licenciatura en artes 2020-11-29 christopher owens male 31 7313 16 de julio stephanie42@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-11-29 kelly montoya female 17 2109 acebal darrenhampton@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-30 julia chapman female 27 2603 chapuy juliewarren@yahoo.com +universidad del salvador técnico para bioterios 2020-11-30 nicholas king male 27 7605 barrio chapadmalal tinameyer@yahoo.com +universidad del salvador licenciatura en administración 2020-11-30 julie macias female 19 4709 san jose de piedra blanca habbott@gmail.com +universidad del salvador técnico para bioterios 2020-11-30 christopher chambers male 23 6405 30 de agosto matthewvasquez@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-11-30 maureen mccall female 25 6461 capitan castro 
stephen46@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-11-30 bradley wright male 22 5531 barrio ferri paula34@gmail.com +universidad del salvador contador público 2020-11-30 cassie blackwell female 35 1713 barrio parque leloir angelaramos@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-11-30 bethany henderson female 35 7263 el chumbeau hendersonadrienne@hotmail.com +universidad del salvador licenciatura en administración 2020-11-30 emily foley female 37 6607 anasagasti andreathomas@yahoo.com +universidad del salvador licenciatura en sociología 2020-11-30 patrick pearson male 27 6551 juan f ibarra cphillips@gmail.com +universidad del salvador ciencias veterinarias 2020-11-30 devin mccoy male 27 1642 san isidro darrenryan@hotmail.com +universidad del salvador licenciatura en administración 2020-11-30 rhonda callahan female 19 2907 general conesa ibrown@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-11-30 james rogers male 23 5613 agua botada james06@hotmail.com +universidad del salvador ciencias veterinarias 2020-11-30 david barber male 17 2721 el arbolito tammy18@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-11-30 darrell griffin male 29 5424 villa lerga bradley12@gmail.com +universidad del salvador contador público 2020-12-01 stacey watts female 35 8402 dina huapi reginalddavis@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-01 zachary mcdonald male 17 4115 agua azul bowenalison@hotmail.com +universidad del salvador ciencias veterinarias 2020-12-01 christopher roberts male 23 3344 2 de julio perrymatthew@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-01 dennis ford male 35 3718 amambay annette41@hotmail.com +universidad del salvador farmacia 2020-12-01 brian alexander male 19 9001 cañadon ferrais avilayvette@yahoo.com +universidad del salvador licenciatura 
en gestión de agroalimentos 2020-12-01 rachel krueger female 37 9009 cañadon lagarto chavezjohn@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-01 jenna huber female 39 3412 albardon dadams@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-01 courtney grant female 27 3230 arbol solo michael11@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-01 brandon jones male 19 9200 arroyo pescado denise90@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-01 sandra perez female 25 6663 juan vela ujacobs@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-02 karl reed male 33 2342 campo el mataco nwatkins@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-02 teresa velasquez female 35 6531 algarrobo michaelnelson@gmail.com +universidad del salvador medicina 2020-12-02 patrick williams male 35 1893 centro agricola el pato johnsondonna@gmail.com +universidad del salvador agronomía 2020-12-02 taylor kramer male 33 8401 cullin manzano courtney43@hotmail.com +universidad del salvador bioquímica 2020-12-02 linda christian female 23 8422 aguada de piedra james55@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-02 natalie smith female 37 5424 villa lerga franklin28@yahoo.com +universidad del salvador agronomía 2020-12-02 matthew romero male 19 7112 aguas verdes joseph54@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-02 brianna houston female 29 9213 cañadon caliente crystal13@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-02 benjamin miller male 33 3530 aldea forestal cooperadriana@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-02 james burns male 17 1611 don torcuato jking@hotmail.com +universidad del salvador contador 
público 2020-12-02 russell martin male 17 8172 arroyo corto tyler82@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-02 heather walker female 25 8500 el dique charles32@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-02 erin beard female 33 5622 colonia jauregui kaylacole@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-02 shannon anderson female 21 6301 ataliva roca tcruz@yahoo.com +universidad del salvador ingeniería mecánica 2020-12-02 madison small female 29 8512 igarzabal bowenbrett@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-03 amy arnold female 19 6309 alpachiri quinnalisha@gmail.com +universidad del salvador medicina 2020-12-03 mary mercado female 26 3705 10 de mayo copelandamy@gmail.com +universidad del salvador licenciatura en sociología 2020-12-03 kathy fowler female 37 5612 valle de las leñas dking@hotmail.com +universidad del salvador ciencias veterinarias 2020-12-03 brett flores male 39 9201 cachel rebeccaperez@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-03 mary davis female 27 5438 alto de sierra westerin@hotmail.com +universidad del salvador licenciatura en artes 2020-12-03 brenda shepherd female 23 3040 asuncion maria brittney50@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-12-03 courtney castro female 37 9113 florentino ameghino angela75@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-03 jeffrey kelley male 39 3716 campo largo xjohnson@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-03 allison roach female 21 2613 la morocha kristina87@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-03 stephen hernandez male 25 3105 diamante briannarodriguez@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-04 frank pruitt male 39 7621 la 
sara lejohn@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-04 julie smith female 35 3226 buena vista karencruz@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-12-04 mikayla gray female 35 4132 agua azul lori87@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-04 robert richardson male 39 1642 san isidro joelcole@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-04 jeremy smith male 17 8431 el hoyo todd40@yahoo.com +universidad del salvador bioquímica 2020-12-04 amanda strong female 20 9000 comodoro rivadavia jrojas@hotmail.com +universidad del salvador agronomía 2020-12-04 paula walker female 29 8172 arroyo corto daltonjustin@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-04 deborah lee female 39 4601 corral de piedras cfisher@yahoo.com +universidad del salvador bioquímica 2020-12-04 beth dixon female 27 5572 alto grande wyatt89@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-04 emily fowler female 18 7620 balcarce xmay@gmail.com +universidad del salvador ciencias veterinarias 2020-12-04 kelsey johnson female 39 3386 caraguatay eturner@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-04 michelle castillo female 17 9041 los antiguos christophermorales@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-04 jennifer petersen female 19 4612 carahunco wdorsey@hotmail.com +universidad del salvador licenciatura en artes 2020-12-04 jamie compton female 35 5717 el pimpollo kimberly66@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-04 gary lane male 27 3005 colonia california fosterjeffrey@hotmail.com +universidad del salvador licenciatura en psicología 2020-12-05 john smith male 39 6309 alpachiri timothy61@gmail.com +universidad del salvador licenciatura en terapia ocupacional 
2020-12-05 robert navarro male 21 3416 arroyo ceibal chungstephen@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-05 bonnie stevens female 21 2311 adolfo alsina coffeywilliam@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-05 derek bailey male 31 2349 colonia dos rosas y la legua haleyrodriguez@yahoo.com +universidad del salvador licenciatura en psicología 2020-12-06 blake cook male 27 8156 el perdido est jose guisasola jacksonamy@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-06 brittany bradshaw female 22 6312 ricardo lavalle harrissean@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-06 karen stanley female 23 5461 aguada de la peña hornejason@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-06 jennifer clark female 26 2301 bella italia pricesteven@hotmail.com +universidad del salvador agronomía 2020-12-06 haley andrews female 39 5261 agua del simbol sean04@gmail.com +universidad del salvador ingeniería electrónica 2020-12-06 rebecca holmes female 23 5417 9 de julio tylerdecker@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-06 beth nelson female 27 6516 amalia ashley22@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-06 teresa hardy female 27 4740 agua salada stewartstacey@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-06 sherri gross female 21 3218 arroyo palmar deleonsara@hotmail.com +universidad del salvador licenciatura en artes 2020-12-06 christine curry female 29 3381 maria magdalena wilsonchristopher@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-07 brett vargas male 35 6435 guamini savila@hotmail.com +universidad del salvador farmacia 2020-12-07 leslie bryan female 21 2725 hughes changchristine@gmail.com +universidad del salvador licenciatura en 
sociología 2020-12-07 julie norman female 25 5563 agua amarga elliottdouglas@yahoo.com +universidad del salvador medicina 2020-12-07 shannon allen female 17 7605 barrio chapadmalal lchavez@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-07 lisa white female 23 1822 valentin alsina sherrera@hotmail.com +universidad del salvador contador público 2020-12-07 jason rodriguez male 19 3101 aldea brasilera ashleyenglish@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-07 eric griffith male 27 1808 alejandro petion frostbeth@yahoo.com +universidad del salvador licenciatura en psicología 2020-12-07 denise gilbert female 21 5547 villa hipodromo freed@hotmail.com +universidad del salvador licenciatura en artes 2020-12-07 brian ray male 25 1903 abasto sean56@yahoo.com +universidad del salvador bioquímica 2020-12-07 richard griffith male 23 4105 abra del tafi ramseyalex@yahoo.com +universidad del salvador licenciatura en psicología 2020-12-07 christopher cooke male 20 5759 calera argentina jamieboyle@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-07 tracy schaefer female 25 1828 banfield xbrown@hotmail.com +universidad del salvador diseño industrial 2020-12-07 angela malone female 21 6476 chiclana ryanjimenez@gmail.com +universidad del salvador medicina 2020-12-07 robyn mccarty female 37 4501 abra del trigo sharon50@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-07 justin davis male 26 5571 chivilcoy gouldlaura@yahoo.com +universidad del salvador técnico para bioterios 2020-12-07 brian tanner male 39 3136 alcaraz norte tiffanyholt@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-07 jennifer taylor female 23 3425 costa grande roserichard@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-07 patricia howard female 26 3052 cañadita michaelwilson@hotmail.com +universidad del salvador 
licenciatura en ciencias antropológicas 2020-12-07 kristin rogers female 31 8417 cañadon chileno michaelharrison@yahoo.com +universidad del salvador medicina 2020-12-08 david armstrong male 27 3188 colonia falco jimmyfernandez@gmail.com +universidad del salvador medicina 2020-12-08 kimberly hopkins female 21 2187 arteaga ajones@hotmail.com +universidad del salvador diseño industrial 2020-12-08 brandon barry male 33 4139 agua amarilla la hoyada heather53@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-08 jason hardin male 23 1723 mariano acosta mark10@gmail.com +universidad del salvador licenciatura en artes 2020-12-08 jill gardner female 23 3272 colonia 1 de mayo jenkinsjeremy@hotmail.com +universidad del salvador ciencias veterinarias 2020-12-08 catherine duncan female 31 9401 el zurdo brooksmonique@yahoo.com +universidad del salvador licenciatura en sociología 2020-12-08 jeffrey kim male 31 5435 algarrobo grande maryconley@gmail.com +universidad del salvador bioquímica 2020-12-08 suzanne reynolds female 31 6022 la oriental vnelson@yahoo.com +universidad del salvador medicina 2020-12-08 belinda anderson female 25 5883 alto lindo hayley27@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-08 angela martin female 19 2942 baradero wmarshall@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-08 john hendricks male 37 5525 buena vista donald26@gmail.com +universidad del salvador agronomía 2020-12-08 jason villegas male 25 2806 las palmas john30@hotmail.com +universidad del salvador diseño industrial 2020-12-08 john mitchell male 33 5645 el cenizo richardgonzales@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-08 alicia bridges female 25 5736 comandante granville davidruiz@yahoo.com +universidad del salvador ingeniería electrónica 2020-12-08 william malone male 25 5543 3 de mayo blakegibson@hotmail.com +universidad del salvador 
contador público 2020-12-09 jennifer moss female 31 2943 ireneo portela allison27@gmail.com +universidad del salvador diseño de imagen y sonido 2020-12-09 martin bailey male 39 2603 chapuy brownzachary@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-12-09 amanda white female 19 1907 el pino ehaley@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-09 elizabeth jones female 25 1678 caseros dominiquepage@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-09 eric clark male 33 5572 alto grande heathernguyen@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-09 lauren clements female 31 6361 agustoni peterromero@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-09 ryan jones male 33 2451 colonia la yerba mark29@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-09 christopher ward male 37 5383 agua colorada cheryl77@gmail.com +universidad del salvador actuario 2020-12-09 andrea moody female 39 2501 berretta robertsoto@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-09 amy hicks female 25 4139 agua amarilla la hoyada zriley@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-09 briana gonzalez female 17 3515 capitan solari harrismike@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-09 christy navarro female 31 4187 anta chica tony37@hotmail.com +universidad del salvador actuario 2020-12-09 jennifer jones female 29 6201 chanilao christopherrose@gmail.com +universidad del salvador arquitectura 2020-12-10 jeremiah singleton male 17 3360 arroyo fedor jenniferbartlett@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-12-10 diane guzman female 31 2821 arroyo del cura williamsamanda@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 
2020-12-10 crystal cantrell female 19 7103 faro san antonio jessica77@hotmail.com +universidad del salvador ingeniería electrónica 2020-12-10 cheryl cruz female 37 1828 banfield charlenebarker@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-10 robert lawrence male 17 4133 la banda dominguezscott@hotmail.com +universidad del salvador ingeniería electrónica 2020-12-10 michelle shaw female 17 1896 camino centenario km 11500 raymond31@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-10 beth carey female 19 8316 balsa senillosa keithowens@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-10 christine williams female 37 6746 cucha cucha angel92@yahoo.com +universidad del salvador técnico para bioterios 2020-12-10 james johnson male 23 9037 aldea beleiro pachecodean@yahoo.com +universidad del salvador actuario 2020-12-10 juan taylor male 39 4164 bajastine juliehenry@hotmail.com +universidad del salvador técnico para bioterios 2020-12-10 robert graves male 29 9023 buen pasto dsparks@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-10 shawn tucker male 21 5743 la isabel barnettvalerie@yahoo.com +universidad del salvador ciencias veterinarias 2020-12-10 desiree curtis female 39 7641 balneario los angeles andrew22@gmail.com +universidad del salvador farmacia 2020-12-10 denise sanchez female 29 5743 la isabel hilladam@gmail.com +universidad del salvador contador público 2020-12-10 rachel ramos female 39 6513 colonia las yescas ywaller@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-11 mike sharp male 31 7307 crotto zhooper@yahoo.com +universidad del salvador contador público 2020-12-11 tammy flores female 25 6352 colonia la india michael50@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-11 robert nicholson male 31 3138 alcaraz 2do courtneylewis@gmail.com +universidad del salvador 
ingeniería en informática 2020-12-11 ryan smith male 22 1663 muñiz cindy93@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-11 william kirk male 35 3718 amambay frank65@hotmail.com +universidad del salvador farmacia 2020-12-11 robert mueller male 23 4411 sey jonesstephen@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-11 philip robinson male 17 3530 aldea forestal tylerturner@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-12 mary conner female 23 3465 arroyo casco wmarsh@gmail.com +universidad del salvador técnico para bioterios 2020-12-12 jonathan johnson male 23 3732 colonia abate fwilson@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-12 michelle floyd female 25 6634 alberti angelaparsons@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-12 troy christian male 23 5471 agua blanca lvazquez@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-12 patricia garcia female 23 4000 estacion de zootecnia b carterjuan@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-12 ashlee peterson female 35 6652 olascoaga bryanwells@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-12 ashley robinson female 25 1911 bme bavio gral mansilla garybennett@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-12 mary green female 35 2527 colonia san francisco christinarichardson@yahoo.com +universidad del salvador farmacia 2020-12-12 joel richardson male 19 4503 arrayanal singletonjames@yahoo.com +universidad del salvador actuario 2020-12-12 ryan turner male 23 3705 10 de mayo heatherharris@yahoo.com +universidad del salvador licenciatura en artes 2020-12-12 justin chase male 35 8118 cabildo wjones@hotmail.com +universidad del salvador licenciatura en planificación y diseño del 
paisaje 2020-12-12 lisa mcbride female 19 7021 alzaga thompsoncraig@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-13 glenn meza male 19 4103 bajo de raco jhart@yahoo.com +universidad del salvador ingeniería en informática 2020-12-13 eric randolph male 39 8370 caminera destinycollins@hotmail.com +universidad del salvador ciencias veterinarias 2020-12-13 jason frost male 17 7165 faro querandi amandapearson@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-13 ann mckee female 39 3109 colonia centenario kristytaylor@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-13 douglas gonzalez male 18 7509 oriente lauraball@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-12-13 charles rivera male 21 3208 colonia ensanche sauce davidcurry@hotmail.com +universidad del salvador ingeniería en informática 2020-12-13 mark lewis male 17 9409 isla gran malvina zfrost@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-13 daniel craig male 25 6641 comodoro py qdennis@yahoo.com +universidad del salvador medicina 2020-12-13 ethan perry male 35 3583 isla tigre dianarussell@yahoo.com +universidad del salvador bioquímica 2020-12-13 bryan kane male 29 2713 manuel ocampo weaverrodney@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-14 jordan herring female 33 6507 corbett gonzalezshawn@gmail.com +universidad del salvador ciencias veterinarias 2020-12-14 gregory sparks male 17 3287 aldea san gregorio mariamitchell@gmail.com +universidad del salvador ingeniería mecánica 2020-12-14 melissa craig female 37 5755 alto del molle eklein@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-14 teresa navarro female 24 1664 trujui andreagardner@gmail.com +universidad del salvador licenciatura en sociología 2020-12-14 heather avila female 29 1735 el durazno grahamryan@hotmail.com +universidad del 
salvador licenciatura en kinesiología y fisiatría 2020-12-14 john lucas male 26 3241 campo de villamil wramirez@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-14 james conley male 19 2740 almacen la colina aprilbell@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-14 henry jones male 25 3731 meson de fierro morriscraig@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-14 ronald davis male 31 6346 pellegrini rickysellers@hotmail.com +universidad del salvador licenciatura en psicología 2020-12-14 jason moore male 37 6228 aguas buenas jessica38@hotmail.com +universidad del salvador ingeniería electrónica 2020-12-14 john little male 31 6311 campo de los toros jsmith@yahoo.com +universidad del salvador ingeniería en informática 2020-12-15 mark klein male 19 6075 arenaza joshuabennett@hotmail.com +universidad del salvador actuario 2020-12-15 cheryl jacobs female 17 3732 colonia abate vincent49@yahoo.com +universidad del salvador farmacia 2020-12-15 tracy young female 25 9013 cañadon seco hthomas@hotmail.com +universidad del salvador licenciatura en sociología 2020-12-15 savannah rodriguez female 25 5400 desamparados amycabrera@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-15 chloe wilson female 19 3101 aldea brasilera donald67@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-15 shelby fitzgerald female 33 5465 baños pismanta nicholssamantha@hotmail.com +universidad del salvador licenciatura en administración 2020-12-15 christine carlson female 27 1602 florida michaelsmith@gmail.com +universidad del salvador contador público 2020-12-15 robert mccarty male 21 2531 landeta romerodevin@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-15 monique cruz female 35 5310 aimogasta derek19@gmail.com +universidad del salvador licenciatura en sociología 2020-12-15 tyler cole 
male 17 6352 colonia la india williamphillips@gmail.com +universidad del salvador diseño de imagen y sonido 2020-12-15 nicole jordan female 37 6103 amenabar teresaalvarez@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-12-16 tyler sullivan male 33 7113 la lucila del mar renee54@gmail.com +universidad del salvador licenciatura en administración 2020-12-16 jonathan martin male 31 2214 aldao nmills@yahoo.com +universidad del salvador ingeniería en informática 2020-12-16 micheal stein male 17 2344 achaval rodriguez diazronald@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-12-16 patricia williams female 23 5634 bowen alec92@gmail.com +universidad del salvador licenciatura en sociología 2020-12-16 allen luna male 29 2752 almacen el descanso cory21@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-12-16 laura mejia female 33 3180 diego lopez debrasullivan@gmail.com +universidad del salvador técnico para bioterios 2020-12-16 amber garcia female 25 7630 hospital necochea wilkinsjohn@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-16 david oliver male 29 2508 armstrong penningtonjason@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-16 lauren baker female 17 5775 bajo grande sstewart@hotmail.com +universidad del salvador arquitectura 2020-12-16 pamela weber female 24 6015 campo coliqueo tinacooper@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-16 colleen warner female 27 1607 villa adelina genebyrd@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-16 kristine dawson female 21 2132 aero club rosario dawn66@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-17 jordan bradford female 39 1670 nordelta desireethompson@yahoo.com +universidad del salvador agronomía 2020-12-17 christopher meza male 25 3543 colonia lote 12 cordovapaul@yahoo.com 
+universidad del salvador licenciatura en gestión de agroalimentos 2020-12-17 kimberly davis female 29 3172 kilometro 208 vthomas@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-17 travis decker male 31 9400 an aike vbrowning@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-17 brandy hood female 39 4726 capayan christopher28@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-17 kevin gray male 27 5417 9 de julio ebowman@hotmail.com +universidad del salvador arquitectura 2020-12-17 david mercado male 29 5367 cachiyuyal brandy46@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-17 justin martinez male 17 3081 cavour crawfordjoel@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-17 veronica miller female 19 5551 estacion uspallata brianwilliams@yahoo.com +universidad del salvador actuario 2020-12-17 melissa parks female 35 5570 alto del salvador brendan00@gmail.com +universidad del salvador licenciatura en administración 2020-12-17 holly turner female 23 8416 anecon grande wilsonlogan@yahoo.com +universidad del salvador farmacia 2020-12-17 jeff bryant male 33 1605 carapachay craig17@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-17 bruce garcia male 27 3041 cacique ariacaiquin fbaker@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-17 mark holt male 33 2156 arsenal de guerra san lorenzo austin38@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-17 krista holden female 17 1872 sarandi marcusware@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-17 nicholas lawrence male 27 6335 graciarena xjohnson@yahoo.com +universidad del salvador licenciatura en administración 2020-12-18 brittany smith female 31 2845 colonia duportal brianmendez@yahoo.com +universidad del salvador licenciatura 
en sociología 2020-12-18 dylan harvey male 20 6605 campo peña lopez ruth99@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-18 kathleen carter female 23 6317 la florencia cbean@hotmail.com +universidad del salvador diseño de imagen y sonido 2020-12-18 xavier smith male 24 3540 avanzada jonathansmith@yahoo.com +universidad del salvador farmacia 2020-12-18 whitney robinson female 24 7151 langueyu michael10@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-18 danielle hall female 39 8127 estela jordansean@yahoo.com +universidad del salvador técnico para bioterios 2020-12-18 brianna long female 26 9011 bahia langara jennifer40@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-18 jenny vance female 25 7220 funke zmiddleton@gmail.com +universidad del salvador licenciatura en sociología 2020-12-18 sheryl martinez female 20 9400 an aike tuckerallison@gmail.com +universidad del salvador bioquímica 2020-12-18 ryan peterson male 33 8400 isla victoria lkelly@yahoo.com +universidad del salvador contador público 2020-12-18 aaron bishop male 23 3005 colonia california jonathan81@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-18 mark johnson male 35 9301 el chalten mwilliams@yahoo.com +universidad del salvador licenciatura en administración 2020-12-18 barbara mcdonald female 35 3244 colonia belga americana mariagarza@gmail.com +universidad del salvador ciencias veterinarias 2020-12-18 allison marshall female 27 9305 cañada de las vacas bartonjohn@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-18 bethany hernandez female 23 1836 llavallol deborahtaylor@gmail.com +universidad del salvador licenciatura en sociología 2020-12-18 nathan franklin male 35 5519 alto de las arañas brittanyforbes@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-19 rachel rivera female 23 9030 rio mayo hgallegos@gmail.com +universidad 
del salvador licenciatura en relaciones del trabajo 2020-12-19 michael lewis male 39 1806 tristan suarez williamsmatthew@gmail.com +universidad del salvador diseño industrial 2020-12-19 kimberly henderson female 31 5421 la tranca fstewart@gmail.com +universidad del salvador farmacia 2020-12-19 kim silva female 27 7103 faro san antonio ivan36@gmail.com +universidad del salvador ciencias veterinarias 2020-12-19 randall cline male 21 2242 arijon hayesdaniel@yahoo.com +universidad del salvador licenciatura en musicoterapia 2020-12-19 raymond hudson male 37 1752 lomas del mirador amandajensen@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-19 gilbert hanson male 22 5365 el jumeal janicelopez@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-19 jordan joseph male 35 3113 colonia celina ysmith@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-19 brandon schultz male 33 3244 colonia belga americana dale02@gmail.com +universidad del salvador diseño de imagen y sonido 2020-12-19 justin nguyen male 19 6706 est jauregui va flandria porozco@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-19 susan elliott female 23 6401 sundblad william67@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-20 amanda rogers female 37 6212 adolfo van praet natasha58@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-20 david west male 27 3718 amambay jessica85@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-20 jason wood male 27 8415 arroyo las minas donna48@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-20 sarah simon female 35 2324 colonia tacurales kevin81@gmail.com +universidad del salvador licenciatura en administración 2020-12-20 francisco sweeney male 17 9121 aguada de las tejas rmcintosh@hotmail.com +universidad del salvador 
licenciatura en psicología 2020-12-20 courtney malone female 31 2202 cerana jasonadams@gmail.com +universidad del salvador licenciatura en sociología 2020-12-20 robert beck male 25 8142 colonia barga randyadams@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-21 christine archer female 19 2611 estacion christophersen rcoleman@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-21 tammy sutton female 37 6472 francisco madero charles28@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-21 dustin anderson male 27 7318 colonia hinojo hhoffman@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-21 lori wright female 39 2812 capilla del señor robin14@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-21 marie park female 22 3360 arroyo fedor jeffgomez@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-21 christopher morris male 17 2449 avena jsmith@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-21 donna horn female 31 2400 villani xmitchell@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-12-21 anthony hodges male 21 6305 atreuco nrodriguez@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-21 susan wilcox female 25 2747 coronel isleños alexander72@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-21 mariah griffith female 23 6309 alpachiri robertberg@yahoo.com +universidad del salvador contador público 2020-12-21 ronnie short male 33 9053 aguada grande xnguyen@hotmail.com +universidad del salvador ciencias veterinarias 2020-12-22 julie martin female 39 5551 estacion uspallata sandovalchristy@yahoo.com +universidad del salvador farmacia 2020-12-22 jessica branch female 17 5261 agua del simbol 
perryashley@gmail.com +universidad del salvador ingeniería electrónica 2020-12-22 keith mcfarland male 21 5715 arbol verde frankwiggins@gmail.com +universidad del salvador ingeniería mecánica 2020-12-22 jill woods female 24 8151 el zorro robertjones@hotmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-22 john parker male 25 3487 puesto de isla johnperry@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-22 susan ross female 23 3340 boqueron brookebullock@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-22 deborah wright female 31 8521 arroyo de la ventana whitneygarza@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-22 robert reilly male 23 4152 aguilares bradfordshawn@hotmail.com +universidad del salvador diseño industrial 2020-12-22 sabrina moody female 25 7301 ariel vpayne@gmail.com +universidad del salvador ciencias veterinarias 2020-12-22 elizabeth thompson female 37 4616 barcena paulawinters@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-22 david peterson male 33 5717 el pimpollo william33@gmail.com +universidad del salvador ingeniería electrónica 2020-12-22 brandon kennedy male 27 4561 la chinaca frances05@hotmail.com +universidad del salvador actuario 2020-12-23 paul barron male 33 2828 colonia nueva montevideo nicholemontoya@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-23 christopher york male 19 5545 agua de diaz adamskaylee@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-23 samuel smith male 17 5386 amana carolynbrown@yahoo.com +universidad del salvador diseño de imagen y sonido 2020-12-23 hector reyes male 35 5549 agua de los manantiales angelamcclain@yahoo.com +universidad del salvador licenciatura en administración 2020-12-23 albert mercer male 37 3400 bañado norte khall@gmail.com +universidad del salvador licenciatura en ciencias 
biológicas 2020-12-23 raymond molina male 20 7113 la lucila del mar crystalhebert@hotmail.com +universidad del salvador arquitectura 2020-12-23 alexis carter female 21 6537 el camoati laura35@yahoo.com +universidad del salvador licenciatura en psicología 2020-12-23 susan brown female 39 4513 alto calilegua david34@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-23 nicholas mendoza male 25 8212 abramo halldillon@yahoo.com +universidad del salvador medicina 2020-12-23 mary white female 31 2633 chovet nicholas19@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-23 emily johnson female 27 2820 colonia el potrero christianreynolds@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-23 jamie hart female 31 2943 ireneo portela mmedina@gmail.com +universidad del salvador técnico para bioterios 2020-12-24 miranda zuniga female 25 3232 cabred stephentorres@gmail.com +universidad del salvador farmacia 2020-12-24 ann nguyen female 35 5710 la punta alex32@gmail.com +universidad del salvador ingeniería en informática 2020-12-24 john johnson male 19 3350 apostoles xdiaz@gmail.com +universidad del salvador licenciatura en sociología 2020-12-24 carolyn robinson female 31 6064 eduardo costa sherrymcbride@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-24 robert mcdaniel male 25 3050 calchaqui scottmichael@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-24 bradley barnes male 39 2933 colonia velez lovevictor@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-24 aaron soto male 29 3281 calera kristirichardson@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-24 travis meadows male 37 1905 jose ferrari ycamacho@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-24 vanessa harris female 23 5533 9 de julio 
nathan71@yahoo.com +universidad del salvador técnico para bioterios 2020-12-24 patricia cowan female 35 5587 barcala briana86@hotmail.com +universidad del salvador diseño industrial 2020-12-24 stephen wall male 27 3156 betbeder rmoore@yahoo.com +universidad del salvador ingeniería en informática 2020-12-24 mark hamilton male 18 4137 abra baya andersonrobert@gmail.com +universidad del salvador bioquímica 2020-12-24 kelly smith female 22 5565 campo de los andes vanessa75@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-24 michael hanson male 31 2918 empalme villa constitucion millercody@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-25 anthony diaz male 29 6032 blandengues xortiz@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-25 william howard male 24 1737 kilometro 77 jzamora@yahoo.com +universidad del salvador ingeniería mecánica 2020-12-25 nancy livingston female 19 6509 del valle cortezbrittany@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-25 nicholas king male 31 2852 alarcon brookssarah@gmail.com +universidad del salvador licenciatura en sociología 2020-12-25 laurie smith female 33 7110 cuartel iv lindsayhenry@hotmail.com +universidad del salvador ingeniería mecánica 2020-12-25 andrew soto male 33 6500 9 de julio maddoxeugene@gmail.com +universidad del salvador diseño de imagen y sonido 2020-12-25 joseph hebert male 24 4146 barrio belgrano willisamy@hotmail.com +universidad del salvador actuario 2020-12-25 kathleen barber female 31 1727 b los aromos san patricio katherinefarley@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-25 frank hale male 29 2216 campo raffo castilloronald@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-25 bobby moore male 23 8309 centenario jamesgregory@gmail.com +universidad del salvador licenciatura en sociología 2020-12-25 alicia 
hardin female 39 2105 cañada rica kristina68@hotmail.com +universidad del salvador licenciatura en sociología 2020-12-25 thomas stewart male 26 4743 aconquija sthomas@yahoo.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-25 kayla webb female 19 6632 benitez jocelyn85@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2020-12-25 jay sullivan male 19 3231 colonia arocena ina vcook@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-25 cynthia carney female 31 5403 barrialitos wilsonkimberly@yahoo.com +universidad del salvador ingeniería mecánica 2020-12-26 wendy nelson female 27 8124 berraondo nhill@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-26 april hansen female 26 3531 colonia aborigen deborahmiller@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-26 haley scott female 18 6537 el camoati matthewrodgers@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-26 joseph oneal male 35 9039 hito 45 lewischristopher@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-26 bryan medina male 23 5565 campo de los andes nancymorton@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-26 andrea mckee female 25 2400 villani amanda01@hotmail.com +universidad del salvador ingeniería en informática 2020-12-26 benjamin hughes male 37 6053 el peregrino angela56@hotmail.com +universidad del salvador ingeniería en informática 2020-12-26 audrey dillon female 39 1742 paso del rey jensenjennifer@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-26 angela anderson female 29 7000 cantera aguirre smithdavid@yahoo.com +universidad del salvador contador público 2020-12-26 david mccoy male 35 2852 alarcon yadams@hotmail.com +universidad del salvador farmacia 2020-12-26 mary tucker female 33 2615 la gama 
yshaw@hotmail.com +universidad del salvador agronomía 2020-12-27 rachel mason female 27 2500 cañada de gomez garzapatricia@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-27 charles jones male 19 8136 algarrobo pyoung@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-27 alex hurley male 31 4624 abra mayo carolyn25@gmail.com +universidad del salvador ingeniería electrónica 2020-12-27 patricia morris female 19 3164 colonia rivas wolfdanielle@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-27 daniel nelson male 37 2000 villa angelica asalazar@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-27 brooke bush female 33 2138 carcaraña isaacford@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-27 amanda roberts female 35 7243 antonio carboni staylor@hotmail.com +universidad del salvador arquitectura 2020-12-27 omar baldwin male 25 1643 beccar richard61@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-27 david kaiser male 27 3515 capitan solari leroydavis@gmail.com +universidad del salvador medicina 2020-12-27 richard banks male 33 9213 cañadon caliente gmorris@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-27 logan lawrence male 33 5743 la isabel hamiltonsteven@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-27 charles bautista male 18 3486 villa olivari colemanmichael@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-27 david cox male 25 9007 el jaguel daltonstacey@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-27 tracy parker female 21 4750 agua colorada qperkins@gmail.com +universidad del salvador ingeniería mecánica 2020-12-27 caitlin long female 19 1621 benavidez jennifer24@gmail.com +universidad del 
salvador licenciatura en musicoterapia 2020-12-27 sara diaz female 31 3418 bartolome mitre ambermartin@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-27 sheri fitzgerald female 27 2521 iturraspe taylorobrien@gmail.com +universidad del salvador licenciatura en psicología 2020-12-28 anthony clements male 39 3705 10 de mayo josephhale@hotmail.com +universidad del salvador contador público 2020-12-28 kristie shaffer female 25 6030 edmundo perkins rebeccahouston@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2020-12-28 jacob dodson male 27 5475 agua de la piedra andrea35@yahoo.com +universidad del salvador contador público 2020-12-28 gabriel alexander male 19 2123 campo calvo robert79@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2020-12-28 lori moore female 37 2170 candelaria sud brianrivers@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-28 alexander simmons male 37 6383 campo moises seccion 1a betty02@yahoo.com +universidad del salvador licenciatura en artes 2020-12-28 dana hartman female 29 4431 aguas calientes williamramos@hotmail.com +universidad del salvador actuario 2020-12-28 jose thompson male 35 5444 ampacama hutchinsonkaren@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-28 lisa bennett female 21 3056 campo coubert maxwelllauren@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-28 regina hutchinson female 19 6616 castilla simpsonmichelle@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2020-12-28 meagan jones female 37 1640 acassuso theodoremoore@yahoo.com +universidad del salvador bioquímica 2020-12-29 laura hernandez female 33 5719 agua amarga smiller@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2020-12-29 edgar stuart male 39 6652 olascoaga ostephens@gmail.com +universidad del salvador licenciatura en 
administración 2020-12-29 darlene estrada female 23 3557 caraguatay dylan54@gmail.com +universidad del salvador licenciatura en sociología 2020-12-29 william carter male 33 1888 florencio varela amcclure@gmail.com +universidad del salvador licenciatura en ciencia política 2020-12-29 stephanie harris female 31 6230 francisco casal josephrogers@gmail.com +universidad del salvador licenciatura en artes 2020-12-29 teresa reed female 29 5471 agua blanca gjohnson@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2020-12-29 kevin jenkins male 37 1763 virrey del pino jacqueline90@yahoo.com +universidad del salvador diseño industrial 2020-12-29 hannah guerrero female 27 1917 luis chico bryanhowell@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-29 timothy moreno male 17 3380 9 de julio kilometro 20 petersonchristian@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-29 paula davis female 39 8345 alumine rebecca60@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2020-12-29 nancy white female 23 1735 el durazno yleon@gmail.com +universidad del salvador bioquímica 2020-12-30 karen bell female 35 6417 casbas jameshowe@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2020-12-30 cynthia roberts female 31 7536 estacion coronel pringles urodriguez@hotmail.com +universidad del salvador farmacia 2020-12-30 brenda ramos female 19 7106 las toninas smorgan@yahoo.com +universidad del salvador actuario 2020-12-30 jessica smith female 31 6221 ceballos walkerchristopher@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2020-12-30 richard mcknight male 39 3027 la pelada moorewendy@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-30 donald mercer male 23 6405 30 de agosto ryan73@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2020-12-30 jennifer stone female 25 
5503 paso de los andes annbass@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2020-12-30 matthew henderson male 23 7108 costa del este samuelhodge@hotmail.com +universidad del salvador licenciatura en ciencia política 2020-12-30 charles davis male 27 5380 chamical stephen62@hotmail.com +universidad del salvador ingeniería electrónica 2020-12-31 andrew arroyo male 18 2743 arroyo dulce charles81@gmail.com +universidad del salvador licenciatura en musicoterapia 2020-12-31 michael wright male 33 8370 caminera welchrandy@hotmail.com +universidad del salvador contador público 2020-12-31 tracy brown female 21 1623 barrio garin norte yflowers@gmail.com +universidad del salvador técnico para bioterios 2020-12-31 christopher morales male 37 6389 alegria kpark@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2020-12-31 rodney garcia male 23 5881 cañada la negra katie74@gmail.com +universidad del salvador ingeniería electrónica 2020-12-31 theresa thompson female 31 2121 perez allenmichelle@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2020-12-31 melissa wiley female 19 2535 el trebol warebrittany@hotmail.com +universidad del salvador diseño industrial 2020-12-31 jennifer williams female 35 5592 el carbalino xhurst@hotmail.com +universidad del salvador ciencias veterinarias 2020-12-31 nancy lewis female 39 5381 bella vista theresamorales@yahoo.com +universidad del salvador licenciatura en ciencia política 2020-12-31 jamie carpenter female 33 8373 alianza dclark@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-01 charles marsh male 37 6075 arenaza marqueztimothy@gmail.com +universidad del salvador diseño industrial 2021-01-01 jennifer abbott female 21 3423 arañita cassandrajones@gmail.com +universidad del salvador bioquímica 2021-01-01 bradley lee male 23 7513 adolfo gonzales chaves kevinparks@gmail.com +universidad del salvador contador público 
2021-01-01 joseph elliott male 23 8415 arroyo las minas keith02@gmail.com +universidad del salvador actuario 2021-01-01 erin luna female 17 8520 aguada del loro jenniferburke@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2021-01-01 james schmidt male 27 5385 aguadita adamsmichele@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-01 julian chavez male 29 2173 campo pesoa shawrebecca@yahoo.com +universidad del salvador licenciatura en psicología 2021-01-01 leslie gallagher female 23 5771 alanices christina46@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-01 shawn alvarado male 37 7406 aldecon kellyyang@yahoo.com +universidad del salvador ingeniería mecánica 2021-01-01 shelby reed female 21 3474 chavarria christine71@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-01 barbara smith female 29 1771 mercado central epeters@hotmail.com +universidad del salvador diseño de imagen y sonido 2021-01-01 alan blanchard male 39 3572 campo garabato deanthomas@hotmail.com +universidad del salvador actuario 2021-01-01 taylor thomas male 39 8170 abra de hinojo thompsonrichard@gmail.com +universidad del salvador diseño industrial 2021-01-02 shawn cain male 27 8334 ingeniero huergo cheneric@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-02 maria manning female 35 4648 barrio la union dianecruz@yahoo.com +universidad del salvador licenciatura en musicoterapia 2021-01-02 aaron burke male 22 2218 carrizales nathaniel14@gmail.com +universidad del salvador técnico para bioterios 2021-01-02 kaylee diaz female 29 5266 chichagasta brendahernandez@yahoo.com +universidad del salvador farmacia 2021-01-02 donald hall male 27 5331 andalucia patricia33@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-02 adrienne levy female 25 8181 azopardo tylerhall@yahoo.com +universidad del salvador agronomía 2021-01-02 
joshua farrell male 27 2214 aldao birderica@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-02 kevin jimenez male 37 7265 cazon lbradford@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-02 michael gibbs male 23 9053 aguada grande kennethwest@gmail.com +universidad del salvador farmacia 2021-01-03 richard griffin male 33 3583 isla tigre clintonthomas@yahoo.com +universidad del salvador contador público 2021-01-03 amanda garcia female 23 4648 barrio la union lori54@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-03 jonathan herrera male 25 5775 bajo grande natalie43@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-03 james acevedo male 37 4605 alisos de abajo currykristina@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-03 julie mcdaniel female 25 3216 arroyo hondo benjamin37@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-03 randall robinson male 21 3481 angostura crystalvelasquez@gmail.com +universidad del salvador ingeniería en informática 2021-01-03 sierra bauer female 29 3574 capilla guadalupe norte ortegamichael@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-03 erika parker female 31 6239 gonzalez moreno reyessara@hotmail.com +universidad del salvador licenciatura en artes 2021-01-03 crystal bennett female 23 1629 almirante irizar mollyporter@hotmail.com +universidad del salvador ingeniería en informática 2021-01-03 robert buchanan male 37 2449 avena laura48@gmail.com +universidad del salvador contador público 2021-01-03 gregory maxwell male 25 5421 la tranca danielreynolds@hotmail.com +universidad del salvador bioquímica 2021-01-04 kelly martin female 21 3476 el remanso beth74@yahoo.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-04 lucas webster male 25 6461 capitan castro cristian06@hotmail.com +universidad 
del salvador licenciatura en gestión de agroalimentos 2021-01-04 brian sanders male 25 2241 larrechea tiffany12@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-04 marvin medina male 19 3085 pilar sheilapugh@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-04 stephen wagner male 17 5401 barrio el tontal sean72@gmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-04 charles vega male 33 8503 chocori jeanne36@hotmail.com +universidad del salvador actuario 2021-01-04 jeremy campbell male 39 2407 campo clucellas jessica22@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-04 amy smith female 27 3080 colonia pujol ijohnson@gmail.com +universidad del salvador arquitectura 2021-01-04 richard brooks male 33 1909 arana lesliechandler@yahoo.com +universidad del salvador licenciatura en ciencia política 2021-01-04 kirsten ferguson female 26 5517 cespedes christopherhall@hotmail.com +universidad del salvador ingeniería en informática 2021-01-04 eric greene male 31 1849 claypole janicerobertson@gmail.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-04 robert dean male 21 2409 estrada ronald73@gmail.com +universidad del salvador contador público 2021-01-04 vicki hawkins female 26 2315 estacion saguier kelseyperry@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-04 william moore male 29 6237 america vholmes@yahoo.com +universidad del salvador licenciatura en sociología 2021-01-04 lisa hayes female 33 3382 colonia cunci jgraham@hotmail.com +universidad del salvador arquitectura 2021-01-04 patrick harper male 17 3553 colonia duran ybond@hotmail.com +universidad del salvador ingeniería en informática 2021-01-04 donald barton male 27 1642 san isidro cameron82@gmail.com +universidad del salvador licenciatura en sociología 2021-01-04 laura reese female 25 1612 ingeniero adolfo sourdeaux 
dominique68@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-04 kimberly williams female 33 2128 arroyo seco heather24@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-04 brooke lee female 19 3014 angel gallardo zjones@yahoo.com +universidad del salvador contador público 2021-01-04 robert gonzalez male 39 6531 algarrobo jose28@gmail.com +universidad del salvador diseño de imagen y sonido 2021-01-05 marissa white female 25 5503 paso de los andes nicholaslane@yahoo.com +universidad del salvador ingeniería en informática 2021-01-05 kevin sanchez male 37 2745 gahan noahdunn@yahoo.com +universidad del salvador agronomía 2021-01-05 shelby johnson female 17 8138 anzoategui geoffreyfleming@gmail.com +universidad del salvador actuario 2021-01-05 nancy daniels female 25 3267 cañada de las ovejas phyllis56@gmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-05 larry wang male 29 5743 la isabel shunt@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-05 terry osborn male 39 2751 almacen castro zrowe@hotmail.com +universidad del salvador actuario 2021-01-05 terry aguilar female 17 3507 la eduvigis bmcguire@yahoo.com +universidad del salvador licenciatura en musicoterapia 2021-01-05 stephen nicholson male 37 5304 el tala wilkinsonebony@gmail.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-05 crystal baxter female 25 3316 arroyo pastora youngkevin@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-05 ryan lewis male 33 3123 aldea santa maria kkent@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-05 sylvia proctor female 25 8506 bahia san blas qbell@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-05 terry stewart female 19 6323 algarrobo del aguila michael23@gmail.com +universidad del salvador medicina 2021-01-05 ashley orr 
female 23 1752 lomas del mirador tyler04@hotmail.com +universidad del salvador medicina 2021-01-06 carolyn wong female 27 6228 aguas buenas eeaton@yahoo.com +universidad del salvador bioquímica 2021-01-06 laura jones female 25 1648 rincon de milberg donald97@hotmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-06 ryan acosta male 37 1917 luis chico madisonwoods@gmail.com +universidad del salvador ingeniería electrónica 2021-01-06 david collins male 22 2848 berisso pamelabenjamin@gmail.com +universidad del salvador ingeniería en informática 2021-01-06 donna moreno female 26 6701 carlos keen upittman@yahoo.com +universidad del salvador diseño industrial 2021-01-06 devin lewis male 37 5553 empalme frontera margaret60@gmail.com +universidad del salvador farmacia 2021-01-06 crystal bowman female 19 4651 agua de castilla jonathan51@gmail.com +universidad del salvador agronomía 2021-01-06 nicole ware female 37 3032 nelson cwilliams@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-06 scott mitchell male 19 6616 castilla nataliestevenson@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-06 tammy wiggins female 35 5589 chapanay sarahwilson@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2021-01-06 jennifer clark female 17 2204 jesus maria john42@gmail.com +universidad del salvador agronomía 2021-01-06 nichole flores female 23 3200 colonia los sauces collinsstephen@gmail.com +universidad del salvador arquitectura 2021-01-06 erika howard female 37 3474 chavarria butlerann@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-07 brian jones male 21 3361 acaragua lopeztoni@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-07 kelly young female 22 8532 arroyo salado rodgerschristopher@yahoo.com +universidad del salvador ingeniería electrónica 2021-01-07 samantha sharp female 26 4242 25 de mayo 
vargaserica@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-07 kathryn bates female 18 2909 estancias millernicole@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-07 deborah king female 35 8514 laguna del barro ycampos@gmail.com +universidad del salvador ingeniería electrónica 2021-01-07 andrea torres female 29 1746 francisco alvarez robertsmith@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-07 sandra palmer female 29 1757 gregorio de laferrere davidbentley@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-07 jeremy lowe male 39 4640 abra pampa garrisonpenny@yahoo.com +universidad del salvador licenciatura en ciencia política 2021-01-07 kelly cohen female 33 2520 la california dawn60@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-07 terry monroe male 21 4701 acostilla simscarolyn@gmail.com +universidad del salvador arquitectura 2021-01-07 daniel bryant male 23 8115 bajo hondo bonniewhitney@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-07 melissa young female 20 8181 azopardo jaredrobles@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-07 michael perez male 19 7517 juan e barra smithmichelle@hotmail.com +universidad del salvador licenciatura en sociología 2021-01-07 patricia gross female 21 3155 costa del nogoya lisashepherd@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2021-01-08 natasha chan female 17 5701 11 de mayo swood@gmail.com +universidad del salvador diseño industrial 2021-01-08 karen woodward female 39 4506 alegria randallcasey@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-08 mark hill male 23 6065 blaquier hjordan@gmail.com +universidad del salvador licenciatura en sociología 2021-01-08 linda anderson female 25 
6743 coliqueo jennifer80@yahoo.com +universidad del salvador licenciatura en musicoterapia 2021-01-08 sierra casey female 31 2119 arminda wallerpatrick@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-08 linda goodwin female 39 2529 piamonte dixonchristina@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-08 mercedes williams female 23 6213 lote 11 escuela 107 ryates@hotmail.com +universidad del salvador licenciatura en ciencia política 2021-01-08 sarah larson female 37 5579 barrio lencina petersonjanet@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-08 claudia sullivan female 33 1825 monte chingolo plambert@hotmail.com +universidad del salvador diseño industrial 2021-01-08 jack ryan male 35 5343 lavalle woodmelvin@yahoo.com +universidad del salvador farmacia 2021-01-08 robert davis male 37 3540 avanzada nlawson@gmail.com +universidad del salvador agronomía 2021-01-08 scott lewis male 19 6431 estacion lago epecuen brownmary@hotmail.com +universidad del salvador licenciatura en ciencias ambientales 2021-01-08 lisa rivera female 17 8311 villa el chocon daniel42@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-08 anthony wall male 27 4608 alto verde johnsonmarvin@yahoo.com +universidad del salvador farmacia 2021-01-09 nicholas cisneros male 25 5353 el zapallar rodneycooley@hotmail.com +universidad del salvador licenciatura en psicología 2021-01-09 alex simpson male 27 9023 buen pasto leonard70@yahoo.com +universidad del salvador ingeniería en informática 2021-01-09 austin kline male 25 4237 cortaderas duncanjeffrey@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-09 elizabeth stone female 21 1744 cuartel v nvillanueva@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-09 sarah webb female 27 3483 arroyo balmaceda jeffreyrogers@yahoo.com 
+universidad del salvador licenciatura en ciencias antropológicas 2021-01-09 jerry edwards male 27 3322 aparicio cue jsimmons@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-09 julie rose female 39 2400 villani vfox@hotmail.com +universidad del salvador ingeniería electrónica 2021-01-09 leah moreno female 35 6720 kilometro 125 sjones@gmail.com +universidad del salvador ingeniería electrónica 2021-01-09 kenneth rodgers male 31 1901 estacion moreno seanhunter@hotmail.com +universidad del salvador actuario 2021-01-10 taylor harmon female 33 2705 haras san jacinto hendricksgary@gmail.com +universidad del salvador agronomía 2021-01-10 beth anderson female 19 3222 buen retiro weavermaureen@gmail.com +universidad del salvador diseño industrial 2021-01-10 valerie swanson female 31 2916 el jupiter kimberly05@hotmail.com +universidad del salvador licenciatura en sociología 2021-01-10 evelyn woods female 37 4600 algarrobal pjohnson@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-10 tyler walker male 37 6600 kilometro 125 kellirivera@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-01-10 douglas nguyen male 35 7003 aceilan valerie00@hotmail.com +universidad del salvador actuario 2021-01-10 elizabeth yates female 37 5385 aguadita steventhomas@gmail.com +universidad del salvador diseño de imagen y sonido 2021-01-11 jordan stein female 35 4648 barrio la union xroberts@yahoo.com +universidad del salvador licenciatura en musicoterapia 2021-01-11 patricia bennett female 19 6230 francisco casal karen85@gmail.com +universidad del salvador ingeniería en informática 2021-01-11 travis kelley male 25 6743 coliqueo michael43@hotmail.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-11 richard king male 29 4605 alisos de abajo hkoch@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-11 lynn larson female 35 8379 gente grande 
katherine10@yahoo.com +universidad del salvador diseño industrial 2021-01-11 john munoz male 35 3445 9 de julio arthur66@gmail.com +universidad del salvador farmacia 2021-01-11 dale acosta male 27 5590 adrian maturano kennedyapril@yahoo.com +universidad del salvador bioquímica 2021-01-11 jonathan mcclure male 35 7003 aceilan raymonddavenport@gmail.com +universidad del salvador diseño industrial 2021-01-11 anna bray female 26 9015 alma grande bowmanstephanie@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-11 jamie palmer female 35 3532 curandu amy18@gmail.com +universidad del salvador medicina 2021-01-11 janet burke female 37 6703 alastuey browncrystal@gmail.com +universidad del salvador licenciatura en psicología 2021-01-11 heidi wood female 39 5645 el cenizo holsen@hotmail.com +universidad del salvador ingeniería electrónica 2021-01-12 deborah barry female 39 7245 campo sabate ehunt@hotmail.com +universidad del salvador ingeniería electrónica 2021-01-12 tony figueroa male 27 1834 temperley michelewilliams@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-12 connor myers male 27 3232 cabred christophergonzalez@yahoo.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-12 valerie robinson female 27 3136 alcaraz norte matthewramirez@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-01-12 kimberly allen female 25 3516 basail angela43@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-12 monica goodwin female 21 5503 paso de los andes garroyo@yahoo.com +universidad del salvador licenciatura en psicología 2021-01-12 daniel campbell male 21 5343 lavalle martin19@gmail.com +universidad del salvador técnico para bioterios 2021-01-12 paul cox male 37 7243 antonio carboni david15@yahoo.com +universidad del salvador licenciatura en sociología 2021-01-12 mackenzie williams female 33 3522 el retiro nhampton@gmail.com 
+universidad del salvador licenciatura en producción de bioimagenes 2021-01-12 julie carter female 37 2806 las palmas andrewagner@yahoo.com +universidad del salvador licenciatura en sociología 2021-01-12 donna david female 39 3003 colonia los zapallos jacob43@hotmail.com +universidad del salvador licenciatura en ciencia política 2021-01-13 william smith male 37 3400 bañado norte farrellnatasha@gmail.com +universidad del salvador licenciatura en ciencia política 2021-01-13 eric todd male 25 8136 algarrobo john50@hotmail.com +universidad del salvador licenciatura en sociología 2021-01-13 holly ryan female 21 6472 francisco madero pottsemma@gmail.com +universidad del salvador actuario 2021-01-13 jennifer hale female 25 3036 aromos katherinecarey@yahoo.com +universidad del salvador contador público 2021-01-13 steven smith male 31 8201 25 de mayo jason52@gmail.com +universidad del salvador farmacia 2021-01-13 jeremy dunlap male 23 7547 cascada ashley15@gmail.com +universidad del salvador ingeniería mecánica 2021-01-13 john patterson male 25 3231 colonia arocena ina thomasscott@hotmail.com +universidad del salvador licenciatura en ciencia política 2021-01-13 timothy brown male 25 7519 san mayol reedkimberly@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-13 troy wallace male 17 3226 buena vista salazarjames@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-14 betty bell female 25 7001 la pastora andrew40@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-14 andrew montgomery male 17 2914 costa brava kelly23@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-14 nathan payne male 37 3001 alto verde michaelsmith@yahoo.com +universidad del salvador ingeniería mecánica 2021-01-14 diane pierce female 17 1612 ingeniero adolfo sourdeaux melissa63@yahoo.com +universidad del salvador ciencias veterinarias 2021-01-14 brian padilla male 37 6381 
campo caretto gina16@hotmail.com +universidad del salvador licenciatura en psicología 2021-01-14 kimberly golden female 23 3220 arroyo manganga jamesbradshaw@yahoo.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-14 john ward male 37 8183 avestruz chadwilliams@gmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-14 robert washington male 23 2445 cristolia melissaphillips@gmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-14 regina munoz female 19 3116 aldea chaleco sarahmaxwell@hotmail.com +universidad del salvador diseño de imagen y sonido 2021-01-14 gregory luna male 31 2529 piamonte jason78@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-14 stephanie rose female 33 2914 costa brava michael72@yahoo.com +universidad del salvador actuario 2021-01-14 sarah gonzales female 27 4616 barcena figueroarichard@yahoo.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-14 robert lucas male 17 4616 barcena james05@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-15 david harrington male 23 6337 ingeniero thompson alexanderdavid@hotmail.com +universidad del salvador contador público 2021-01-15 joseph smith male 19 3129 colonia hernandarias braycheryl@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2021-01-15 natalie baxter female 19 8360 buena esperanza frederick05@gmail.com +universidad del salvador actuario 2021-01-15 donna morrison female 29 4603 catamontaña dennis36@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-15 sydney price female 27 6346 pellegrini singletonjoshua@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-15 christy burke female 21 3461 abo nezu valerie17@gmail.com +universidad del salvador medicina 2021-01-15 nancy ward female 25 1748 general rodriguez edwardcooper@hotmail.com +universidad 
del salvador licenciatura en terapia ocupacional 2021-01-15 susan johnson female 25 8324 cipolletti mkramer@gmail.com +universidad del salvador licenciatura en sociología 2021-01-15 kevin holt male 19 6551 juan f ibarra mschmidt@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-15 matthew lewis male 33 3712 los frentones malik58@gmail.com +universidad del salvador licenciatura en administración 2021-01-15 erica chang female 35 8316 balsa senillosa michaelshields@yahoo.com +universidad del salvador ciencias veterinarias 2021-01-16 rachel hughes female 26 4713 ocho vados adrian35@gmail.com +universidad del salvador farmacia 2021-01-16 timothy warren male 37 6317 la florencia johnsonsheena@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-16 james anderson male 23 1688 villa santos tesei karen32@hotmail.com +universidad del salvador diseño de imagen y sonido 2021-01-16 brittany griffin female 25 2147 san genaro norte johnarias@hotmail.com +universidad del salvador licenciatura en artes 2021-01-16 joseph novak male 35 2805 arroyo aleli ryan08@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-16 sarah young female 31 5611 agua rica rwhite@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-16 rachel harris female 37 5515 maipu mccarthyfernando@yahoo.com +universidad del salvador ingeniería mecánica 2021-01-16 jeffrey foster male 33 5409 adan quiroga ubennett@gmail.com +universidad del salvador contador público 2021-01-16 troy rogers male 19 5421 la tranca ronald06@gmail.com +universidad del salvador técnico para bioterios 2021-01-16 marcus holland male 33 6643 araujo walkerscott@hotmail.com +universidad del salvador ingeniería en informática 2021-01-16 wendy jensen female 25 2943 ireneo portela becky66@hotmail.com +universidad del salvador licenciatura en administración 2021-01-16 rebecca pugh female 19 1727 b los 
aromos san patricio alishaenglish@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2021-01-16 katherine lane female 25 6352 colonia la india brangel@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-17 mark mccoy male 23 3285 berduc snydersara@yahoo.com +universidad del salvador técnico para bioterios 2021-01-17 krystal rodriguez female 19 6063 porvenir hhall@gmail.com +universidad del salvador agronomía 2021-01-17 gina lee female 37 3357 barra bonita karenroberson@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-17 kristy cooper female 21 1752 lomas del mirador kevin16@yahoo.com +universidad del salvador licenciatura en administración 2021-01-17 angela davis female 31 1854 longchamps phillip46@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-17 rebecca nielsen female 27 4723 alijilan oliviareynolds@hotmail.com +universidad del salvador diseño industrial 2021-01-17 paul graham male 35 4655 cabreria gregory66@gmail.com +universidad del salvador bioquímica 2021-01-17 katherine nelson female 29 4146 barrio belgrano yclayton@hotmail.com +universidad del salvador bioquímica 2021-01-17 kevin robinson male 21 3066 campo garay gonzaleselizabeth@yahoo.com +universidad del salvador diseño industrial 2021-01-17 steven wilkinson male 23 6453 carlos salas uanderson@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-17 margaret villanueva female 39 8501 bahia creek raven83@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-18 cynthia williams female 31 5303 anjullon johnsontravis@gmail.com +universidad del salvador licenciatura en sociología 2021-01-18 martha brown female 23 6309 alpachiri hmcgee@gmail.com +universidad del salvador ingeniería en informática 2021-01-18 james whitaker male 23 7612 camet greenjuan@hotmail.com +universidad del salvador licenciatura en 
ciencia política 2021-01-18 nicole williams female 19 8415 arroyo las minas lisacantu@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-18 dustin stewart male 17 6034 colonia alberdi simmonseileen@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-18 susan johnson female 23 3318 bonpland norte brownjake@gmail.com +universidad del salvador farmacia 2021-01-18 gary chang male 27 6550 bolivar regina51@yahoo.com +universidad del salvador licenciatura en psicología 2021-01-18 gregory adams male 26 4616 barcena awilliams@gmail.com +universidad del salvador licenciatura en ciencia política 2021-01-19 mark griffin male 27 5411 la legua mcbriderebecca@yahoo.com +universidad del salvador licenciatura en administración 2021-01-19 nicholas johnston male 25 1704 ramos mejia brandonburton@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-19 zachary jenkins male 19 2946 el espinillo batesnorma@gmail.com +universidad del salvador técnico para bioterios 2021-01-19 kathryn clark female 35 1629 almirante irizar holly98@hotmail.com +universidad del salvador ingeniería en informática 2021-01-19 patrick hill male 23 6601 altamira jacob66@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-19 chad garcia male 17 1649 zona delta tigre omiller@hotmail.com +universidad del salvador actuario 2021-01-19 megan bradley female 31 5587 barcala destiny55@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-01-19 kristen johnson female 37 3076 huanqueros fitzpatrickeric@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-01-19 melissa romero female 39 5585 el cipres nicholaschandler@gmail.com +universidad del salvador ciencias veterinarias 2021-01-19 renee patrick female 31 3706 avia terai williamgay@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2021-01-20 stephen 
taylor male 27 7511 balneario oceano wendylong@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-20 kimberly davenport female 31 9100 cerro santa ana mclaughlincindy@gmail.com +universidad del salvador arquitectura 2021-01-20 derrick hammond male 27 9217 cholila jamietanner@hotmail.com +universidad del salvador actuario 2021-01-20 stacey duran female 37 3560 campo ubajo greenesteven@hotmail.com +universidad del salvador farmacia 2021-01-20 carl kramer male 19 2352 ambrosetti kristopher60@gmail.com +universidad del salvador técnico para bioterios 2021-01-20 sandy beltran female 17 7009 iraola murphyjennifer@gmail.com +universidad del salvador licenciatura en psicología 2021-01-20 chelsea smith female 29 1766 tablada nicolewallace@hotmail.com +universidad del salvador bioquímica 2021-01-20 sheryl heath female 27 1640 acassuso iruiz@yahoo.com +universidad del salvador ciencias veterinarias 2021-01-20 heidi garcia female 37 5555 puente del inca loriholmes@yahoo.com +universidad del salvador licenciatura en artes 2021-01-20 william taylor male 37 7208 coronel boerr whitedanielle@yahoo.com +universidad del salvador arquitectura 2021-01-20 lance dyer male 27 7163 claverie duanemarquez@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-20 todd cohen male 39 7163 claverie john29@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-20 megan price female 31 6612 capdepont gabriel10@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-20 bailey caldwell female 37 8506 bahia san blas allenkara@gmail.com +universidad del salvador licenciatura en sociología 2021-01-21 gary kennedy male 24 9051 aguada a pique umarquez@yahoo.com +universidad del salvador diseño de imagen y sonido 2021-01-21 shannon skinner female 31 1761 20 de junio garrettmoore@gmail.com +universidad del salvador licenciatura en ciencias ambientales 2021-01-21 richard ingram male 21 
6701 carlos keen mortonsarah@gmail.com +universidad del salvador licenciatura en sociología 2021-01-21 linda brown female 27 8164 arquedas vbailey@yahoo.com +universidad del salvador diseño industrial 2021-01-21 megan herrera female 27 1836 llavallol zchapman@hotmail.com +universidad del salvador licenciatura en producción de bioimagenes 2021-01-21 andrea goodman female 26 2761 estancia santa catalina nicolemckay@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-21 stephen charles male 25 5444 ampacama tanderson@yahoo.com +universidad del salvador diseño industrial 2021-01-21 carol roberson female 35 3076 huanqueros orangel@yahoo.com +universidad del salvador agronomía 2021-01-21 juan burgess male 37 3380 9 de julio kilometro 20 rachellewis@yahoo.com +universidad del salvador contador público 2021-01-21 michelle miller female 29 4631 antiguo shayes@yahoo.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-01-21 justin harris male 25 3101 aldea brasilera woodsbrian@gmail.com +universidad del salvador agronomía 2021-01-21 eric harrington male 29 2723 estancia las gamas stevenmcmillan@hotmail.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-21 tanner mccullough male 39 3371 cabure lisa28@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-22 mariah dean female 21 1884 berazategui zswanson@hotmail.com +universidad del salvador licenciatura en terapia ocupacional 2021-01-22 christopher brown male 26 9221 valle hondo clong@hotmail.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-22 peter bates male 27 4751 agua de dionisio carpentercarl@hotmail.com +universidad del salvador técnico para bioterios 2021-01-22 anita rowe female 17 2117 alcorta michaelfields@gmail.com +universidad del salvador licenciatura en ciencia política 2021-01-22 sarah jones female 29 7531 despeñaderos danielmiller@yahoo.com +universidad del salvador licenciatura 
en ciencias antropológicas 2021-01-22 jennifer bonilla female 22 6269 la colina coxtimothy@yahoo.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-22 melissa ward female 21 9315 bajo caracoles erik45@hotmail.com +universidad del salvador licenciatura en administración 2021-01-22 kim carlson female 20 1858 villa numancia tonyjackson@hotmail.com +universidad del salvador contador público 2021-01-23 tammy rios female 25 1621 benavidez hshort@hotmail.com +universidad del salvador ingeniería en informática 2021-01-23 james brown male 24 2185 campo crenna brandon33@gmail.com +universidad del salvador medicina 2021-01-23 sean grimes male 19 5701 11 de mayo jasminehall@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-23 angela myers female 27 3181 arroyo moreira alexanderhinton@hotmail.com +universidad del salvador contador público 2021-01-23 cheryl cain female 25 9223 alto rio pico bellcaitlin@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-23 amy copeland female 17 3592 colonia hardy jeremypotter@hotmail.com +universidad del salvador farmacia 2021-01-23 joseph bennett male 27 1923 arroyo del pescado john96@hotmail.com +universidad del salvador ingeniería mecánica 2021-01-23 mark randall male 33 8319 campamento sol debbiesimpson@hotmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-23 william elliott male 23 5561 ancon rsutton@gmail.com +universidad del salvador actuario 2021-01-23 amy smith female 27 5500 cerro aconcagua andrew80@gmail.com +universidad del salvador licenciatura en artes 2021-01-23 brian pearson male 25 1893 centro agricola el pato owhite@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-23 daniel fox male 25 3123 aldea santa maria william62@gmail.com +universidad del salvador licenciatura en ciencias de la educación 2021-01-23 james reyes male 29 7174 arroyo grande 
michealrios@gmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-24 diane williams female 19 6461 capitan castro cassandra44@hotmail.com +universidad del salvador bioquímica 2021-01-24 darrell holmes male 23 2617 sancti spiritu ujackson@gmail.com +universidad del salvador ingeniería en informática 2021-01-24 hannah williams female 31 3507 la eduvigis amber07@hotmail.com +universidad del salvador licenciatura en artes 2021-01-25 thomas davis male 19 7545 huanguelen clarkalexis@yahoo.com +universidad del salvador contador público 2021-01-25 ruth miller female 25 1669 del viso sabrina79@hotmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-25 brenda henry female 23 2401 castelar bookerchristopher@gmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-25 benjamin stuart male 37 3156 betbeder kathleensanders@yahoo.com +universidad del salvador medicina 2021-01-25 crystal montgomery female 27 4718 barro negro bjordan@gmail.com +universidad del salvador agronomía 2021-01-25 victoria higgins female 27 4631 antiguo websterbradley@yahoo.com +universidad del salvador licenciatura en sociología 2021-01-25 michael henderson male 39 5521 los corredores desireetucker@yahoo.com +universidad del salvador ciencias veterinarias 2021-01-26 cheryl jones female 29 3125 antonio tomas hoffmansandra@hotmail.com +universidad del salvador técnico para bioterios 2021-01-26 rebecca pratt female 23 3071 aguara grande stephaniealexander@hotmail.com +universidad del salvador licenciatura en administración 2021-01-26 tammy fox female 31 3386 caraguatay bgentry@gmail.com +universidad del salvador licenciatura en producción de bioimagenes 2021-01-26 diane clark female 35 9203 aldea escolar yduncan@yahoo.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-26 tracy herrera female 35 6303 cachirulo andreanelson@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 
2021-01-26 diana davenport female 27 2722 wheelwright joel88@gmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-26 renee juarez female 19 1884 berazategui cwu@hotmail.com +universidad del salvador bioquímica 2021-01-26 travis rivers male 23 2000 villa angelica ycastillo@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2021-01-26 joseph stokes male 26 8532 arroyo salado charlescook@gmail.com +universidad del salvador medicina 2021-01-26 christine rios female 37 5343 lavalle xchapman@hotmail.com +universidad del salvador licenciatura en planificación y diseño del paisaje 2021-01-26 linda reyes female 18 3569 barros pazos millerjohn@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-26 marcus reeves male 27 1849 claypole emma33@hotmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-26 dave baker male 39 5645 el cenizo nreyes@yahoo.com +universidad del salvador licenciatura en musicoterapia 2021-01-26 kathleen smith female 35 4753 corralito courtneystewart@gmail.com +universidad del salvador actuario 2021-01-26 mitchell gonzalez male 37 6700 caminera lujan jacksonpatricia@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-27 mark burnett male 37 2315 estacion saguier jacksonkatie@hotmail.com +universidad del salvador medicina 2021-01-27 jessica davis female 25 3164 colonia rivas bradley05@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-27 emily simon female 29 3230 arbol solo xmoore@hotmail.com +universidad del salvador farmacia 2021-01-27 judith mcclain female 23 6660 25 de mayo matapaul@yahoo.com +universidad del salvador licenciatura en ciencias ambientales 2021-01-27 justin martin male 20 3112 colonia loma negra jerry11@hotmail.com +universidad del salvador diseño de imagen y sonido 2021-01-27 kimberly levy female 19 9311 cañadon leon xmccarty@hotmail.com 
+universidad del salvador licenciatura en ciencias de la educación 2021-01-27 kayla finley female 25 7265 cazon haley55@yahoo.com +universidad del salvador licenciatura en ciencia política 2021-01-27 alexandra perez female 21 3370 planchada banderita beltrankathleen@gmail.com +universidad del salvador ingeniería en informática 2021-01-27 whitney cowan female 33 7208 coronel boerr gperez@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-27 thomas camacho male 31 3425 costa grande ybrown@gmail.com +universidad del salvador diseño de imagen y sonido 2021-01-27 beth farrell female 18 6605 campo peña lopez walkerlisa@hotmail.com +universidad del salvador diseño de imagen y sonido 2021-01-27 thomas rodriguez male 35 3132 el pingo wendy23@hotmail.com +universidad del salvador licenciatura en administración 2021-01-27 lisa bridges female 33 9017 cameron timothyrobinson@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-27 gary reese male 29 3563 colonia san manuel tony25@hotmail.com +universidad del salvador ciencias veterinarias 2021-01-28 crystal anderson female 21 8126 aldea san andres andrewschristopher@gmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-28 amy davis female 33 4158 campo de talamayo pmiller@yahoo.com +universidad del salvador licenciatura en artes 2021-01-28 joseph patel male 24 4605 alisos de abajo santossusan@gmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 2021-01-28 bradley brown male 23 6513 colonia las yescas valeriecraig@yahoo.com +universidad del salvador ingeniería en informática 2021-01-28 kim daniels female 33 3248 caraguata larrywilson@hotmail.com +universidad del salvador arquitectura 2021-01-28 nicole roberts female 37 6612 capdepont gateskatherine@gmail.com +universidad del salvador bioquímica 2021-01-28 bethany trujillo female 25 6223 coronel charlone morenocaleb@gmail.com +universidad del salvador farmacia 2021-01-28 
melissa love female 27 1759 gonzalez catan sara98@gmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-01-29 rachel wilson female 33 2152 granadero baigorria yolandabaker@gmail.com +universidad del salvador licenciatura en psicología 2021-01-29 randy adkins male 31 3313 arroyo del medio margaretdelacruz@gmail.com +universidad del salvador ingeniería en informática 2021-01-29 kevin calderon male 33 1921 alvarez jonte aday@hotmail.com +universidad del salvador ingeniería electrónica 2021-01-29 abigail newton female 37 8503 chocori paullee@yahoo.com +universidad del salvador diseño de imagen y sonido 2021-01-29 catherine murphy female 29 5560 arroyo claro briannadaniel@gmail.com +universidad del salvador licenciatura en ciencias biológicas 2021-01-29 kathleen fitzpatrick female 27 2000 villa angelica joseph47@gmail.com +universidad del salvador actuario 2021-01-29 nicholas shaw male 19 7003 aceilan marymason@gmail.com +universidad del salvador licenciatura en sociología 2021-01-29 sara ramsey female 29 3700 barrio gral jose de san martin sellersshane@hotmail.com +universidad del salvador arquitectura 2021-01-29 janet wyatt female 17 3056 campo coubert wellsmichael@hotmail.com +universidad del salvador licenciatura en musicoterapia 2021-01-29 charlene allen female 23 1903 abasto odonnelleugene@gmail.com +universidad del salvador diseño industrial 2021-01-30 katelyn ross female 19 2512 campo charo pclarke@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2021-01-30 rachael davidson female 26 5711 angelita morrisjerry@gmail.com +universidad del salvador licenciatura en artes 2021-01-30 mariah meyer female 23 5759 calera argentina simpsonbrian@gmail.com +universidad del salvador medicina 2021-01-30 james hampton male 21 5343 lavalle bwood@gmail.com +universidad del salvador ingeniería electrónica 2021-01-30 lisa webb female 26 7633 maori amandacabrera@gmail.com +universidad del salvador licenciatura en psicología 
2021-01-30 daniel white male 23 1822 valentin alsina eharris@yahoo.com +universidad del salvador licenciatura en ciencias antropológicas 2021-01-30 leah miller female 19 6228 aguas buenas kristin83@yahoo.com +universidad del salvador ingeniería electrónica 2021-01-30 sarah young female 39 3501 campo de galnasi melissa85@hotmail.com +universidad del salvador contador público 2021-01-30 steven parker male 35 2501 berretta jon09@hotmail.com +universidad del salvador medicina 2021-01-30 joshua li male 29 2643 cafferata harristimothy@yahoo.com +universidad del salvador farmacia 2021-01-30 anthony gutierrez male 25 3425 costa grande anthonyjohnson@yahoo.com +universidad del salvador agronomía 2021-01-30 barbara smith female 17 1755 rafael castillo richardsonmonica@hotmail.com +universidad del salvador licenciatura en ciencia política 2021-01-31 krista adams female 24 5350 el molle hmorgan@yahoo.com +universidad del salvador ingeniería mecánica 2021-01-31 danny crawford male 31 3316 arroyo pastora nmueller@hotmail.com +universidad del salvador licenciatura en administración 2021-01-31 corey thomas male 19 6105 cañada seca ahopkins@hotmail.com +universidad del salvador licenciatura en ciencias de la computación 2021-01-31 joe watts male 23 3103 aldea santafecina dennisdominique@hotmail.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-01-31 kathy lopez female 29 6309 alpachiri murphymanuel@hotmail.com +universidad del salvador farmacia 2021-01-31 meghan nelson female 21 2313 colonia berlin vkhan@hotmail.com +universidad del salvador farmacia 2021-01-31 robert ortega male 25 2115 colonia valdez mcdanielmark@yahoo.com +universidad del salvador licenciatura en artes 2021-01-31 tyler allen male 39 1890 juan maria gutierrez uturner@gmail.com +universidad del salvador licenciatura en relaciones del trabajo 2021-01-31 michelle franklin female 25 8370 caminera qweaver@hotmail.com +universidad del salvador licenciatura en ciencia y tecnología de alimentos 
2021-01-31 debbie english female 29 5541 algarrobal abajo lisaflores@hotmail.com +universidad del salvador licenciatura en sociología 2021-02-01 adam brewer male 39 1870 avellaneda lowecatherine@hotmail.com +universidad del salvador ciencias veterinarias 2021-02-01 carmen williams female 18 6223 coronel charlone jrodriguez@yahoo.com +universidad del salvador diseño de imagen y sonido 2021-02-01 jennifer duran female 39 2944 rio tala caitlinyoung@yahoo.com +universidad del salvador licenciatura en musicoterapia 2021-02-01 tyler page male 23 6660 25 de mayo tiffanymurphy@yahoo.com +universidad del salvador licenciatura en ciencias geológicas 2021-02-01 michael wright male 25 1921 alvarez jonte walterlarry@yahoo.com +universidad del salvador técnico para bioterios 2021-02-01 susan barker female 18 5596 12 de octubre bergeralejandra@gmail.com +universidad del salvador diseño de imagen y sonido 2021-02-01 audrey haynes female 19 8180 colonia dr gdor udaondo hallkatelyn@yahoo.com +universidad del salvador licenciatura en gestión de agroalimentos 2021-02-01 vincent welch male 29 6417 casbas garrett30@yahoo.com +universidad del salvador actuario 2021-02-01 kyle melendez male 33 1776 9 de abril emilycurry@hotmail.com +universidad del salvador licenciatura en sociología 2021-02-01 melissa mcclure female 33 6339 cailomuta rickey75@gmail.com +universidad del salvador ingeniería mecánica 2021-02-01 michael moses male 31 2703 cabo san fermin laura79@hotmail.com +universidad del salvador licenciatura en kinesiología y fisiatría 2021-02-01 lisa johnson female 29 7637 la dulce abigail27@yahoo.com +universidad del salvador licenciatura en producción de bioimagenes 2021-02-01 pamela clark female 19 1618 ricardo rojas william03@hotmail.com +universidad del salvador ingeniería en informática 2021-02-01 renee walker female 21 1815 escuela agricola don bosco cbrown@yahoo.com diff --git a/datasets/README.md b/datasets/README.md index cff39c73..bb3ad23f 100644 --- a/datasets/README.md +++ 
b/datasets/README.md @@ -1 +1 @@ -Aqui se dejarán los resultantes del proceso de transformación. \ No newline at end of file +Aqui se dejarán los resultantes del proceso de transformación. diff --git a/files/GBUNComahue_select.csv b/files/GBUNComahue_select.csv new file mode 100644 index 00000000..17aeba4e --- /dev/null +++ b/files/GBUNComahue_select.csv @@ -0,0 +1,1832 @@ +,universidad,carrera,fecha_de_inscripcion,name,sexo,fecha_nacimiento,codigo_postal,correo_electronico +0,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-01,GREGORY HOWELL,M,1954-10-13,5315,FRANKALEXANDRA@YAHOO.COM +1,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-01,TASHA BROWN,F,1984-11-29,8305,TEDWARDS@GMAIL.COM +2,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-01,IAN TAYLOR,M,1976-11-23,3428,RICHARD76@GMAIL.COM +3,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-01,MARK SANCHEZ,M,2002-06-19,5873,ODUFFY@YAHOO.COM +4,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-01,SHERRI CARTER,F,1923-01-17,1765,FOSTERCHASE@GMAIL.COM +5,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-01,PATRICIA GARDNER,F,1974-05-10,3197,HUGHESNINA@YAHOO.COM +6,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-01,MARISSA JOHNS,F,1988-10-15,6034,JOHN91@YAHOO.COM +7,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-01,CRYSTAL WILLIAMS,F,1949-01-28,6017,LEEBRAD@YAHOO.COM +8,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-01,NICOLE SMITH,F,1909-11-27,1925,JSHIELDS@YAHOO.COM +9,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-01,TIMOTHY DYER,M,1913-04-03,5429,MARIAJACKSON@HOTMAIL.COM +10,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-02,CHRISTINA LONG,F,1934-07-24,4750,WILLIAMMCPHERSON@YAHOO.COM +11,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-02,MICHELE RIVERA,F,1927-08-03,2721,EWINGDIANA@GMAIL.COM +12,UNIV. 
NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-02,STEVEN MAY,M,1925-09-04,6437,PEREZCHRISTOPHER@YAHOO.COM +13,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-02,MARY LARSON,F,1909-11-26,7519,MICHAELWHITE@YAHOO.COM +14,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-02,KENNETH HENRY,M,2007-06-01,8170,QYOUNG@HOTMAIL.COM +15,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-02,CARMEN CLARK,F,1978-10-28,5741,RICHARDJOHNSON@GMAIL.COM +16,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-02,HALEY CARPENTER,F,1955-03-29,3585,YSHEPHERD@YAHOO.COM +17,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-02,ANGELA SIMMONS,F,1939-09-03,3158,STONEKIMBERLY@YAHOO.COM +18,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-02,MATTHEW WILSON,M,1957-04-12,5835,CAMPBELLDAVID@GMAIL.COM +19,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-02,JOHN HERNANDEZ,M,1965-06-21,3172,LISA58@GMAIL.COM +20,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-02,JOSEPH MCCARTHY,M,1986-03-25,2931,LAURENCHURCH@HOTMAIL.COM +21,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-02,MICHAEL DIAZ,M,1945-03-24,5557,WOODSYDNEY@HOTMAIL.COM +22,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-02,SHAWN THOMAS,M,1988-09-01,5317,WILLIAM73@HOTMAIL.COM +23,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-02,JULIE GUERRERO,F,1936-05-06,3109,WARNERSHIRLEY@GMAIL.COM +24,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-02,MELISSA NEWTON,F,1998-09-14,2527,NELSONMEGAN@YAHOO.COM +25,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-03,ALLEN SKINNER,M,1986-06-08,6651,MARKSMITH@GMAIL.COM +26,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-03,ERIN JENNINGS,F,1988-03-03,6307,MARTINEZSTEPHANIE@GMAIL.COM +27,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-03,STACEY KIDD,F,1945-09-11,2715,ZSEXTON@HOTMAIL.COM +28,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-03,WARREN TORRES,M,1977-10-17,3111,BISHOPKEVIN@HOTMAIL.COM +29,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-03,NATALIE GILBERT,F,1944-11-05,3134,COWANJENNIFER@GMAIL.COM +30,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-03,MARGARET JIMENEZ,F,2018-03-29,3192,JENNIFERTHOMPSON@YAHOO.COM +31,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-03,KRISTOPHER WRIGHT,M,2004-02-21,1842,ELLIOTTASHLEY@GMAIL.COM +32,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-03,TODD WARREN,M,1938-12-11,2142,DEBRA01@HOTMAIL.COM +33,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-03,IAN FREEMAN,M,1924-11-28,2630,JOSHUAMORGAN@HOTMAIL.COM +34,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-04,ALEXIS FORD,F,1957-06-20,7400,WESTTAMARA@GMAIL.COM +35,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-04,DAWN ROBERTS,F,2003-03-08,6321,MANNINGBARBARA@YAHOO.COM +36,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-04,JASON MONTES,M,1925-08-09,3194,WBRYANT@HOTMAIL.COM +37,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-04,JESSE FRAZIER,M,1934-01-31,6233,MATTHEW83@YAHOO.COM +38,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-04,ANTHONY JACKSON,M,1950-06-24,8534,WILLIAMSTRACY@YAHOO.COM +39,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-04,SHERRI HESTER,F,1999-08-09,8347,DONALDREILLY@GMAIL.COM +40,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-04,ANITA MARTINEZ,F,2016-09-13,1890,OKELLEY@GMAIL.COM +41,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-04,ANDRE GUTIERREZ,M,1921-06-07,5600,JASONJONES@HOTMAIL.COM +42,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-04,CATHERINE MAY,F,1984-02-14,1664,ANTHONYJOHNSON@HOTMAIL.COM +43,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-04,JEFFREY OBRIEN,M,1954-06-03,3337,TRANSCOTT@YAHOO.COM +44,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-04,AMANDA HILL,F,1909-10-18,8105,GREGORYBAKER@YAHOO.COM +45,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-04,TRACEY ANDERSON,F,1998-02-05,1927,SROWE@GMAIL.COM +46,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-04,ANGELA GILMORE,F,2004-07-15,3536,JOHNSONTARA@HOTMAIL.COM +47,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-04,CARLA BARNES DDS,F,1907-05-20,5384,HALLIAN@GMAIL.COM +48,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-05,MATTHEW FROST,M,1908-06-25,6042,HPARKER@HOTMAIL.COM +49,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-05,ZACHARY JACKSON,M,1994-11-25,6455,RODRIGUEZSCOTT@HOTMAIL.COM +50,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-05,AMY MENDOZA,F,1948-03-08,2508,CHAMBERSKEVIN@GMAIL.COM +51,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-05,ZACHARY OBRIEN,M,2015-05-15,3366,RYANLEE@HOTMAIL.COM +52,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-05,CRAIG RICHARDS,M,1919-08-01,5439,JENNIFER39@GMAIL.COM +53,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-05,THOMAS BROWN,M,1993-10-21,1770,LSANFORD@GMAIL.COM +54,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-05,LEAH BRANCH DVM,F,1953-04-27,4000,MASONKEVIN@YAHOO.COM +55,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-05,ASHLEY SCOTT,F,1980-09-19,4516,ASIMMONS@YAHOO.COM +56,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-05,FRANK ROBINSON,M,1942-05-08,5596,PMANNING@YAHOO.COM +57,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-05,KELLI RIVERA,F,2021-06-21,8363,OYOUNG@HOTMAIL.COM +58,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-05,VICKI PHILLIPS,F,2016-11-27,7011,ROBERTSLISA@HOTMAIL.COM +59,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-06,EDWARD TAYLOR,M,1965-11-30,9050,WHITEHEADSHANE@HOTMAIL.COM +60,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-06,NICHOLAS JOHNSON,M,1945-01-31,3461,YTORRES@GMAIL.COM +61,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-06,JAMES PETTY,M,1969-03-13,5521,ETHANJIMENEZ@HOTMAIL.COM +62,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-06,JAMIE SMITH,F,1993-09-14,2216,ZACHARY24@YAHOO.COM +63,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-06,ANDREW MYERS,M,1939-01-20,7533,BREANNAWARD@YAHOO.COM +64,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-06,JULIA MILLS,F,1988-05-25,6503,KOCHRICKEY@HOTMAIL.COM +65,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-06,CATHERINE MANN,F,2005-11-24,4230,KATELYNWEST@HOTMAIL.COM +66,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-06,VALERIE HUGHES,F,1941-06-05,7203,SMCDONALD@GMAIL.COM +67,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-07,RICHARD BROWN,M,1971-04-03,1601,CHELSEY16@HOTMAIL.COM +68,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-07,CATHERINE BUSH,F,2001-12-17,2309,AMANDADOYLE@GMAIL.COM +69,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-07,NICHOLAS VASQUEZ,M,1976-11-02,2185,NBURGESS@HOTMAIL.COM +70,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-07,SAMANTHA FERGUSON,F,2003-03-26,2445,ALYSSAMOORE@HOTMAIL.COM +71,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-07,EMILY PAGE,F,1946-07-09,2705,ROBERT29@HOTMAIL.COM +72,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-07,AMANDA DIAZ,F,1994-03-22,3344,JEFFERYDENNIS@HOTMAIL.COM +73,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-07,CHRISTINE MAYER,F,2014-02-04,2156,TAYLORDANA@YAHOO.COM +74,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-07,DAVID JONES,M,1922-12-11,1842,HERNANDEZMEGAN@GMAIL.COM +75,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-07,MARK BRADLEY,M,1942-04-27,2113,TWEBB@GMAIL.COM +76,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-07,JOHN BOWEN,M,1916-01-30,2824,RHART@GMAIL.COM +77,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-07,ROBERT MORENO,M,1934-03-08,3574,NWATSON@YAHOO.COM +78,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-07,ANDREA ALEXANDER,F,1991-06-11,1896,CHRISTINA09@GMAIL.COM +79,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-07,FELICIA VALDEZ,F,1921-09-18,3620,GREENEFREDERICK@YAHOO.COM +80,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-07,MICHELE ROMERO,F,1997-06-10,1739,SALINASJANICE@YAHOO.COM +81,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-07,MICHAEL MOSLEY,M,1962-08-22,6500,DONNAJONES@HOTMAIL.COM +82,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-07,CHARLES LEACH,M,1964-12-04,5779,BARBARATURNER@YAHOO.COM +83,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-08,MICHAEL SIMPSON,M,1910-08-26,6652,DAVIDGAINES@YAHOO.COM +84,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-08,AMANDA JORDAN,F,1939-09-10,3522,ROBERT92@GMAIL.COM +85,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-08,JESSICA ROSS,F,1928-08-27,6003,ROBERT92@YAHOO.COM +86,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-08,DARLENE GARNER,F,1921-03-06,3366,JMADDEN@HOTMAIL.COM +87,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-08,PATRICK GARRETT,M,1983-09-21,4186,GREENECHARLES@YAHOO.COM +88,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-08,ZOE OCONNELL,F,1908-07-01,5419,JILL45@GMAIL.COM +89,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-08,MICHELLE SHELTON,F,1906-05-14,3427,BREWERAMBER@GMAIL.COM +90,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-08,MEGAN MENDOZA,F,1984-11-19,3416,MICHELLELYNCH@HOTMAIL.COM +91,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-08,JOSEPH ESTRADA,M,1908-01-13,6643,OATKINSON@GMAIL.COM +92,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-09,JENNIFER MAY,F,1978-12-08,5474,AARON63@GMAIL.COM +93,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-09,JORDAN GILMORE,M,1970-09-13,3472,WSPENCER@HOTMAIL.COM +94,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-09,MICHAEL THOMPSON,M,1992-02-22,2824,KIMBERLY13@GMAIL.COM +95,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-09,DR. JAMES TAYLOR DDS,M,1935-10-25,2500,SHEENASILVA@HOTMAIL.COM +96,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-09,KIM BURTON,F,1948-02-15,5438,ROGERSDAVID@YAHOO.COM +97,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-09,TRICIA EVANS,F,1962-05-31,5589,MILLERGREGORY@HOTMAIL.COM +98,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-09,KIRK CALDERON,M,1910-02-11,2609,CPALMER@HOTMAIL.COM +99,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-09,KIMBERLY CALDERON,F,1955-04-12,3181,GGRAHAM@GMAIL.COM +100,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-09,ERIN REEVES,F,1923-08-16,2854,TIMOTHYVEGA@YAHOO.COM +101,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-09,RACHEL NEWMAN,F,1984-07-02,1678,OSCARNIELSEN@YAHOO.COM +102,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-09,RACHEL LANE,F,2011-04-13,5423,SANDERSBRANDY@GMAIL.COM +103,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-09,MELVIN CASTRO,M,1975-04-15,2527,KEITHGLENN@GMAIL.COM +104,UNIV. 
NACIONAL DEL COMAHUE,MEDICINA,2020-09-09,TRICIA MENDOZA,F,1936-02-14,6244,SMITHBRYAN@YAHOO.COM +105,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-09,BRITTANY SOTO,F,1983-07-17,5511,DUSTIN57@YAHOO.COM +106,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-09,MRS. REGINA REID,F,1930-09-25,5345,PERRYNOAH@YAHOO.COM +107,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-10,STACY HALL MD,F,1980-12-16,2828,ZWALTERS@HOTMAIL.COM +108,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-10,MONICA GARCIA,F,1988-07-22,6239,ALLISON79@GMAIL.COM +109,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-10,RODNEY NEAL,M,1955-10-11,1646,SCHMITTANTHONY@HOTMAIL.COM +110,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-10,MELISSA NELSON,F,1944-10-23,6230,AMCCORMICK@HOTMAIL.COM +111,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-10,JASON WYATT,M,1905-11-21,3216,RLOWE@GMAIL.COM +112,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-10,DUANE FOWLER,M,2019-01-26,1872,STEVEN63@HOTMAIL.COM +113,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-10,KATHERINE BENSON,F,1910-06-17,7118,UJONES@HOTMAIL.COM +114,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-10,JOHN PARKS,M,1962-01-06,7165,MBALDWIN@HOTMAIL.COM +115,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-10,ERICA HAMPTON,F,1984-07-21,6700,CARMENWARREN@YAHOO.COM +116,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-10,SHERRY JOHNSON,F,1987-02-14,5636,JANET27@HOTMAIL.COM +117,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-10,JACK JACKSON,M,1935-09-07,8333,EJONES@HOTMAIL.COM +118,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-10,TIFFANY CONTRERAS,F,1926-10-14,3203,DANIELLEGRAHAM@HOTMAIL.COM +119,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-10,JENNIFER FOX,F,1940-07-05,3196,QSTRICKLAND@GMAIL.COM +120,UNIV. 
NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-10,STEVEN SMITH,M,1999-06-29,1627,KRISTIN73@GMAIL.COM +121,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-11,LARRY MARTINEZ,M,1963-08-11,3057,PETERHESS@GMAIL.COM +122,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-11,THERESA BENTLEY,F,2007-01-17,1879,HOLSON@GMAIL.COM +123,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-11,LISA VINCENT,F,1920-11-08,6667,GOMEZJOSE@YAHOO.COM +124,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-11,JENNY VALDEZ,F,1930-03-02,6701,WILEYJACQUELINE@HOTMAIL.COM +125,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-11,CHRISTOPHER GUTIERREZ,M,1954-09-08,2121,JRUSH@GMAIL.COM +126,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-11,AMANDA DYER,F,1936-04-22,2208,SRODRIGUEZ@YAHOO.COM +127,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-11,MELISSA WALLACE,F,1912-03-07,1870,THOMAS12@GMAIL.COM +128,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-11,MARIO ROSALES,M,2010-04-17,8424,XCARROLL@YAHOO.COM +129,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-11,HALEY ADKINS,F,1974-08-21,5444,GARRISONSTACIE@YAHOO.COM +130,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-11,CARLOS JOHNSON,M,1975-02-13,6614,OWENGEORGE@YAHOO.COM +131,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-11,HANNAH BALLARD,F,2021-09-23,7249,MONIQUE87@GMAIL.COM +132,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-11,RONNIE WOOD,M,2004-02-07,7169,LEWISLISA@HOTMAIL.COM +133,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-11,STEVEN FIELDS,M,1929-08-31,1686,BROOKEWHITE@YAHOO.COM +134,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-12,MEGAN GREEN,F,1947-12-28,2134,HEATHER75@YAHOO.COM +135,UNIV. 
NACIONAL DEL COMAHUE,MEDICINA,2020-09-12,RICHARD SANCHEZ,M,1968-10-13,5470,YYATES@YAHOO.COM +136,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-12,JOEL KELLY,M,1987-11-14,9030,CHRISTOPHER34@GMAIL.COM +137,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-12,ASHLEY SCHULTZ,F,1987-08-03,3234,FJIMENEZ@YAHOO.COM +138,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-12,CASSANDRA MOORE,F,1971-03-07,3183,THOMPSONBRANDON@YAHOO.COM +139,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-12,SCOTT EVANS,M,1998-01-08,2812,MARKJACKSON@HOTMAIL.COM +140,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-12,CHRISTOPHER LANE,M,1962-02-25,2800,RYAN53@GMAIL.COM +141,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-12,DAVID MILLER,M,1956-01-21,2138,DEBORAHLEWIS@GMAIL.COM +142,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-12,HANNAH MOORE,F,2016-01-24,1812,TAYLORMIKAYLA@HOTMAIL.COM +143,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-12,COREY LINDSEY,M,1964-01-25,4109,PAIGETREVINO@YAHOO.COM +144,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-12,MATTHEW GAMBLE,M,1999-02-24,7150,ACARROLL@YAHOO.COM +145,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-12,MOLLY FOWLER,F,1953-05-05,8187,STEPHANIE22@YAHOO.COM +146,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-12,AARON ROY,M,1940-05-18,1865,JOHNGUZMAN@GMAIL.COM +147,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-13,JESSE KELLEY,M,1922-12-20,8208,WOODNICOLE@GMAIL.COM +148,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-13,CARL SMITH,M,1919-04-01,7240,SPEARSJARED@YAHOO.COM +149,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-13,TYLER YOUNG,M,2001-06-17,7407,JAMES90@HOTMAIL.COM +150,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-13,JOSEPH GREGORY,M,1912-12-21,5730,BRENDA13@GMAIL.COM +151,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-13,NICHOLE PAYNE,F,1991-03-22,5535,FRAZIERSUSAN@YAHOO.COM +152,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-13,CHARLES CARTER,M,1911-06-15,5753,DAVID64@YAHOO.COM +153,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-13,RODNEY JACOBSON,M,1992-02-17,7136,WESTJOSEPH@HOTMAIL.COM +154,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-13,SANDRA JOHNSON,F,1951-04-24,5565,XMEZA@GMAIL.COM +155,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-14,VERONICA WILSON,F,1985-08-01,5555,YVELAZQUEZ@GMAIL.COM +156,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-14,JASON CHEN,M,2000-04-11,5343,GARNERANTHONY@HOTMAIL.COM +157,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-14,MICHAEL JACKSON,M,1973-02-13,9225,HOLLY00@YAHOO.COM +158,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-14,KIMBERLY MCLEAN,F,1945-04-23,5327,ROBINSONDAVID@YAHOO.COM +159,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-14,ANTHONY HERNANDEZ,M,1993-04-20,1986,ROBERT92@HOTMAIL.COM +160,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-14,CRYSTAL CARPENTER,F,1955-01-18,3218,ALICIA62@GMAIL.COM +161,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-14,MR. ALEX COPELAND,M,1944-09-21,5763,WELLIS@HOTMAIL.COM +162,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-14,CINDY MARTIN,F,1946-06-10,2527,LYNNHOLLAND@YAHOO.COM +163,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-14,BRIAN ARMSTRONG,M,1920-10-27,2218,GMILLER@GMAIL.COM +164,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-15,SARA BELL,F,1950-06-28,5407,IHOOVER@YAHOO.COM +165,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-15,KIMBERLY THOMAS,F,1942-03-19,3705,JHARRIS@YAHOO.COM +166,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-15,SCOTT HORTON,M,1997-08-10,2520,SARAH39@YAHOO.COM +167,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-15,THERESA LE,F,1992-02-10,2121,PAULCORTEZ@GMAIL.COM +168,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-15,JOANNE ANDERSON,F,2019-07-26,5306,JOSEPH32@YAHOO.COM +169,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-15,STEVEN HARPER,M,1912-05-19,6075,JENNIFER14@HOTMAIL.COM +170,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-15,DAVID LARA,M,1944-09-26,4722,NZAMORA@GMAIL.COM +171,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-15,NATHAN VAUGHN,M,1988-09-03,6661,COREYSHARP@HOTMAIL.COM +172,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-15,BONNIE RILEY,F,1933-03-09,4622,JASON74@YAHOO.COM +173,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-15,ALEXANDER KRAMER,M,2021-01-23,2944,JESSE67@YAHOO.COM +174,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-15,MALLORY MOORE,F,1914-06-24,2907,HAYDENTHOMAS@GMAIL.COM +175,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-16,DEREK WEBB,M,1940-05-24,3072,MARYMORENO@HOTMAIL.COM +176,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-16,CHRISTOPHER MACK,M,1992-10-25,9409,JOSHUA96@YAHOO.COM +177,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-16,ARTHUR ARELLANO,M,2005-10-28,8200,PARRISHKELLY@YAHOO.COM +178,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-16,CINDY BISHOP,F,1931-04-03,6050,VICKIEJENKINS@HOTMAIL.COM +179,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-16,PAULA PETERS,F,1949-07-24,9315,SAMANTHAHATFIELD@GMAIL.COM +180,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-16,SHERRY HOFFMAN,F,1938-06-25,4431,MARYREED@HOTMAIL.COM +181,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-16,MISS JESSICA BURNS,F,1915-08-31,6538,JEFFREYDAVIS@GMAIL.COM +182,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-16,KEVIN FITZGERALD,M,1947-11-02,5266,ADAVENPORT@GMAIL.COM +183,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-16,RYAN CURTIS,M,1958-12-31,2344,NELSONAMY@YAHOO.COM +184,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-09-16,JOHN JONES,M,1913-10-22,2300,SHELTONMATTHEW@GMAIL.COM +185,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-16,DEBORAH CARTER,F,1951-03-18,6700,RICHARDJOHNSON@GMAIL.COM +186,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-17,DAVID LUNA,M,1971-06-12,3117,HGARDNER@YAHOO.COM +187,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-17,JASON HERNANDEZ,M,1913-08-08,6009,PDAVIS@GMAIL.COM +188,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-17,DEBORAH WILSON,F,2020-09-30,9400,KAREN52@GMAIL.COM +189,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-17,AMY SMITH,F,2003-07-13,9223,ESPINOZAJESSICA@YAHOO.COM +190,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-17,JOSEPH STEVENSON,M,1924-06-23,7172,ANDREW27@HOTMAIL.COM +191,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-17,GEORGE SCHULTZ,M,1936-11-17,7160,DWRIGHT@GMAIL.COM +192,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-17,MEGAN GARDNER,F,1911-06-28,2933,KYLE23@YAHOO.COM +193,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-17,JESSICA BURNS,F,2015-01-22,2613,THOMAS03@GMAIL.COM +194,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-17,TONYA NGUYEN,F,1973-09-01,2200,NATHANHOOVER@YAHOO.COM +195,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-17,TROY LAWRENCE,M,2008-07-06,6430,JAMES77@GMAIL.COM +196,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-17,SUZANNE PHILLIPS,F,1928-01-26,4643,TPOWERS@HOTMAIL.COM +197,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-17,NANCY JONES,F,1933-08-21,1746,RANDY73@GMAIL.COM +198,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-18,KAREN CASTILLO,F,2020-04-05,9039,WALKERRODNEY@YAHOO.COM +199,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-18,CHRISTIAN SANCHEZ,M,2012-05-25,6641,ALEXIS34@YAHOO.COM +200,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-18,TONY YOUNG,M,1982-12-30,2347,GORDONWILLIAM@YAHOO.COM +201,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-18,LORI SANFORD,F,1998-10-14,6628,XWIGGINS@HOTMAIL.COM +202,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-18,JANE CAMPBELL,F,2002-08-16,7311,GILLESPIEBRIAN@YAHOO.COM +203,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-18,SANDRA MILLER,F,1925-12-10,6065,THORNTONKIMBERLY@HOTMAIL.COM +204,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-18,KATHY POWELL,F,1962-08-23,3133,CHRIS21@HOTMAIL.COM +205,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-18,CHRISTOPHER HICKMAN,M,1926-03-07,7220,DLOPEZ@GMAIL.COM +206,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-19,CHARLES GARDNER,M,1944-06-22,7408,VBURNETT@YAHOO.COM +207,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-19,WENDY GREEN,F,1978-09-09,1858,TINAMCCANN@HOTMAIL.COM +208,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-19,SHARON HUGHES,F,1971-07-12,4147,GARYREILLY@HOTMAIL.COM +209,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-19,PATRICIA BROWN,F,1966-01-18,2843,JACOBGARCIA@HOTMAIL.COM +210,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-19,GARY BERRY,M,2000-06-20,4724,JENNIFER89@YAHOO.COM +211,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-19,ALEXANDRIA LEE,F,1925-10-04,8305,FRANKJASON@GMAIL.COM +212,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-19,MICHELLE SIMMONS,F,1926-01-11,1655,BRENDAN58@GMAIL.COM +213,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-19,MARK ESPINOZA,M,1984-10-04,1822,HFRANK@HOTMAIL.COM +214,UNIV. 
NACIONAL DEL COMAHUE,FARMACIA,2020-09-19,ROBERT MOORE,M,1959-01-28,3085,LORIWONG@HOTMAIL.COM +215,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-19,RICARDO TAYLOR,M,1919-07-08,1684,WHITNEY61@HOTMAIL.COM +216,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-19,PAUL BROWN,M,1978-04-29,2752,ZWILCOX@YAHOO.COM +217,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-19,MARTHA MORGAN,F,1938-08-22,6203,TRACYWILKINSON@HOTMAIL.COM +218,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-19,ROBERT CARPENTER,M,1937-03-10,5461,ANTHONYSMITH@HOTMAIL.COM +219,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-19,TAYLOR DUNCAN,F,2000-04-01,5755,PHILLIP16@YAHOO.COM +220,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-20,BRENDA ANDERSON,F,1925-06-25,9107,TUCKERRICHARD@YAHOO.COM +221,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-20,IAN CARTER,M,1981-06-29,4152,HARRISONDAVID@GMAIL.COM +222,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-20,MARIA HALL,F,1997-04-24,3164,BJACKSON@GMAIL.COM +223,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-20,LINDA COLLINS,F,1935-04-22,2852,FCLARK@GMAIL.COM +224,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-20,CHARLES TORRES,M,1917-07-28,2506,RALPH16@YAHOO.COM +225,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-20,DANA GONZALEZ,F,2017-03-07,6601,GARCIAJESSE@HOTMAIL.COM +226,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-20,RITA THOMAS DVM,F,2007-05-01,4237,JACOBWARREN@YAHOO.COM +227,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-20,CHRISTOPHER MORRIS,M,1990-09-18,6343,QGONZALEZ@YAHOO.COM +228,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-20,CHRISTOPHER MOORE,M,1931-12-09,8303,CASSANDRACRUZ@GMAIL.COM +229,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-20,STANLEY STEVENSON,M,1931-03-10,5431,MONICADUNCAN@HOTMAIL.COM +230,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-21,JACQUELINE SNYDER,F,1985-10-05,8400,CHARLESORTIZ@YAHOO.COM +231,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-21,KIMBERLY SMITH,F,1946-01-18,5713,KEVINRIVERA@GMAIL.COM +232,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-21,REGINALD SHEPHERD,M,1923-05-02,7107,DUDLEYCURTIS@HOTMAIL.COM +233,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-21,DONALD BYRD,M,2001-11-21,5523,MELINDA63@GMAIL.COM +234,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-21,JONATHAN MEDINA,M,2014-12-17,8208,NICHOLSCARLOS@GMAIL.COM +235,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-21,JAMES BAKER,M,1927-11-22,1802,STEVEN22@YAHOO.COM +236,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-21,WESLEY KING,M,1934-02-17,8412,AMARTIN@HOTMAIL.COM +237,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-21,ROBERT WRIGHT,M,1918-11-05,4622,ASHLEYMARTINEZ@GMAIL.COM +238,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-21,BRIAN STEVENS,M,2006-03-05,5547,MICHAEL62@GMAIL.COM +239,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-21,ROBERT LONG,M,1994-04-22,6648,YGREEN@GMAIL.COM +240,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-21,CONNIE MOORE,F,1951-07-15,1655,STARKJOHN@HOTMAIL.COM +241,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-21,OMAR ROSS,M,1922-03-06,7165,MATTHEWKING@GMAIL.COM +242,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-21,CHERYL NIELSEN,F,2008-03-02,2204,LINDAEVANS@GMAIL.COM +243,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-21,JOSEPH MITCHELL,M,1911-12-22,2156,JIMMYMORENO@GMAIL.COM +244,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-22,MARTHA AYALA,F,1980-07-08,4105,JSMITH@YAHOO.COM +245,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-22,ERIKA LEE,F,2016-12-31,7635,PEGGYJONES@GMAIL.COM +246,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-22,BRANDY ROBINSON,F,1945-07-22,5533,MASONHOFFMAN@HOTMAIL.COM +247,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-22,EUGENE WONG,M,1950-02-11,8373,LISA17@GMAIL.COM +248,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-22,MANUEL ENGLISH,M,1984-01-30,6652,XHILL@HOTMAIL.COM +249,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-22,CLAUDIA PEREZ,F,1917-08-24,8308,XRICHARDSON@YAHOO.COM +250,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-22,KIMBERLY ESPARZA,F,1994-12-04,8307,JEFFREYCOOPER@GMAIL.COM +251,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-22,PATRICIA WILSON,F,2005-04-27,3051,JOSHUARAMIREZ@YAHOO.COM +252,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-22,JULIAN SMITH,M,1989-04-27,7412,ANTHONYREBEKAH@HOTMAIL.COM +253,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-23,CHAD LEE DDS,M,1909-07-21,6065,AWALKER@YAHOO.COM +254,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-23,PAUL MOORE,M,1937-01-13,8153,TAMARASANTOS@GMAIL.COM +255,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-23,KIM HOFFMAN,F,1980-08-29,5381,SOBRIEN@YAHOO.COM +256,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-23,JOSEPH GRAY,M,2007-10-06,5615,JONESRYAN@YAHOO.COM +257,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-23,JOHNNY CARTER,M,1920-03-28,7208,DOUGLAS26@HOTMAIL.COM +258,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-09-23,ANTHONY JOHNSON,M,1965-06-25,5624,JOSHUARODRIGUEZ@HOTMAIL.COM +259,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-23,SARAH MARTIN,F,1979-10-08,3113,YHUGHES@GMAIL.COM +260,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-23,MARIA ANDERSON,F,1984-03-15,5605,TANYA29@YAHOO.COM +261,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-24,JAMES GARRISON,M,1923-10-11,5261,ANGELAHIGGINS@HOTMAIL.COM +262,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-24,AMBER HALL,F,1970-06-24,7267,BHOWARD@YAHOO.COM +263,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-24,JOANNA ADAMS,F,1938-02-07,4101,PEREZJONATHAN@HOTMAIL.COM +264,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-24,LISA HOLDEN,F,1919-07-02,2454,CHRISTOPHERMORGAN@YAHOO.COM +265,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-24,SUSAN WALLACE,F,2003-03-13,2828,LAUREN17@GMAIL.COM +266,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-24,KATHERINE MITCHELL,F,1962-11-19,3013,MICHAELROMERO@GMAIL.COM +267,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-24,RICHARD STEPHENS,M,1907-02-12,6216,KMOORE@YAHOO.COM +268,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-24,JULIA LOPEZ,F,1934-04-21,6507,PACHECOSTEVEN@GMAIL.COM +269,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-24,DAVID SANDERS,M,2003-08-12,6461,RAVENGILL@YAHOO.COM +270,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-24,TYLER LEE,M,1973-07-04,2854,ANTHONYKING@GMAIL.COM +271,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-24,ASHLEY RANDALL,F,2019-11-27,1708,RSCOTT@GMAIL.COM +272,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-09-24,BREANNA WELLS,F,2020-09-20,5710,KEVIN45@YAHOO.COM +273,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-24,BRITTNEY GIBSON,F,2011-08-03,4159,JOHNNYBRADLEY@HOTMAIL.COM +274,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-24,JOSEPH BOYER,M,1906-03-07,2216,GARY33@HOTMAIL.COM +275,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-24,MATTHEW CASTILLO,M,1973-07-28,5417,SMITHJOSHUA@HOTMAIL.COM +276,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-24,JAMES EDWARDS,M,2008-09-28,6557,BETTYBELL@GMAIL.COM +277,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-25,MR. MATTHEW TAYLOR,M,1996-10-20,3060,CHRISTOPHERPETERSON@GMAIL.COM +278,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-25,WILLIAM FIGUEROA,M,1918-12-04,7404,KATHLEEN16@YAHOO.COM +279,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-09-25,ALICIA ZIMMERMAN,F,1972-03-31,6453,JASONPARKS@HOTMAIL.COM +280,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-25,BRITTANY HOLT,F,1911-01-10,3511,DENISE76@GMAIL.COM +281,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-25,KATHRYN GARCIA,F,2011-04-24,7407,DONNAROSS@YAHOO.COM +282,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-25,MARY MORSE,F,1934-01-19,3486,CAMERONPEGGY@HOTMAIL.COM +283,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-25,LORI HERNANDEZ,F,2004-10-21,3714,JUSTINGONZALES@YAHOO.COM +284,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-25,SHERRY SMITH,F,1958-11-24,3007,KARENMCCOY@YAHOO.COM +285,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-25,JAKE GOMEZ,M,1910-10-18,2403,HEATHER62@HOTMAIL.COM +286,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-09-25,GREGORY BAKER,M,2017-05-03,5579,HERNANDEZCHRISTIAN@YAHOO.COM +287,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-09-25,KAITLYN RICE,F,1908-01-23,4143,DPARKER@GMAIL.COM +288,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-26,AMY DELACRUZ,F,1931-08-01,8109,BRITTANYHOLDER@YAHOO.COM +289,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-26,DEBORAH GARCIA,F,1978-12-16,2801,MARTINMICHELLE@GMAIL.COM +290,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-26,KEVIN SMITH,M,1965-07-17,2900,KELSEYDUNCAN@HOTMAIL.COM +291,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-26,DONALD JONES,M,1911-08-17,7109,JEFFREY29@GMAIL.COM +292,UNIV. 
NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-09-26,MARK FAULKNER,M,1934-01-27,1871,ENGLISHLINDSAY@YAHOO.COM +293,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-09-26,ALBERT BOOKER,M,1967-01-29,5407,KCAREY@HOTMAIL.COM +294,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-26,JULIA MILLER,F,2018-05-02,1714,EMIDDLETON@HOTMAIL.COM +295,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-26,SHAWN CAMPBELL,M,1987-11-05,6383,BOWMANTAMMY@YAHOO.COM +296,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-26,TAYLOR TANNER,F,1938-05-20,5306,GTHOMAS@HOTMAIL.COM +297,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-26,DAVID KNIGHT,M,1964-09-04,4648,TYLER23@YAHOO.COM +298,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-26,SHANNON CUEVAS,F,1960-12-03,2930,GARNERSHAWN@YAHOO.COM +299,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-26,JOSHUA HERNANDEZ,M,2017-02-04,3374,KEVINPARKER@GMAIL.COM +300,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-26,BRANDON HAMILTON,M,1956-10-01,5407,OHOLT@GMAIL.COM +301,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-26,ADAM BAKER,M,1921-07-03,6643,LNEWMAN@YAHOO.COM +302,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-26,SANDRA KNAPP,F,2011-04-10,6628,QMCGRATH@YAHOO.COM +303,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-09-26,CHARLES ROSARIO,M,1996-12-21,7105,DONALDHORN@GMAIL.COM +304,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-26,KIMBERLY BOOTH,F,1955-05-24,3364,JACOB03@YAHOO.COM +305,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-26,JEANNE RODRIGUEZ,F,1945-07-22,4701,JASON48@HOTMAIL.COM +306,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-09-27,AUDREY GUZMAN,F,1944-09-07,8107,JOSHUA14@HOTMAIL.COM +307,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-27,ANTHONY SKINNER,M,1914-08-12,3044,KAREN55@GMAIL.COM +308,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-27,JESSICA JONES,F,1986-09-10,8151,OBRENNAN@YAHOO.COM +309,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-27,DAVID FOSTER,M,1934-04-26,2187,ZJONES@HOTMAIL.COM +310,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-27,DANA MCGEE,F,2016-04-12,6511,NATHAN61@HOTMAIL.COM +311,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-27,JEFFREY RICHARDSON,M,1913-10-12,5303,LAURA56@HOTMAIL.COM +312,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-09-27,CHARLES JOHNSON,M,1915-06-07,3518,DAVID57@HOTMAIL.COM +313,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-09-27,ROBERT GATES,M,1947-05-17,2208,SUSANSANDOVAL@YAHOO.COM +314,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-09-27,MICHAEL BRIDGES,M,2010-01-26,2843,ANTHONY45@GMAIL.COM +315,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-27,ANTHONY SUTTON,M,1963-07-10,1884,JBLANCHARD@YAHOO.COM +316,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-27,TAMMY PEREZ,F,1917-12-10,1986,ESMITH@YAHOO.COM +317,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-27,CASSANDRA SANFORD,F,1984-10-16,2944,LUKE63@HOTMAIL.COM +318,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-27,TAYLOR JOHNSON,M,2015-05-15,6559,JACOBCUNNINGHAM@YAHOO.COM +319,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-27,KENNETH NEWMAN,M,1915-11-24,4176,EREEVES@YAHOO.COM +320,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-27,RAYMOND JOHNSON,M,1976-03-10,1741,JESSICAJACKSON@YAHOO.COM +321,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-09-27,ABIGAIL HILL,F,1909-07-13,5750,LLONG@HOTMAIL.COM +322,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-27,LAUREN MIRANDA,F,1915-07-22,8185,RONALD22@HOTMAIL.COM +323,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-27,DAVID HAAS,M,2008-07-08,5561,MICHELLE99@YAHOO.COM +324,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-27,LINDA FIGUEROA,F,1981-10-13,4142,VTORRES@YAHOO.COM +325,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-09-28,MICHELE YU,F,1959-03-20,6403,LINDSEYJORDAN@HOTMAIL.COM +326,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-28,ANDREW FOSTER,M,1993-01-21,6343,KRISTINJONES@GMAIL.COM +327,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-28,RICHARD WALKER,M,2010-03-04,5734,NRAYMOND@HOTMAIL.COM +328,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-28,KATHERINE NICHOLS,F,2006-08-01,4235,NEDWARDS@HOTMAIL.COM +329,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-09-28,MICHELE LOPEZ,F,1917-05-13,8105,HENDRIXVINCENT@GMAIL.COM +330,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-09-28,PEGGY EDWARDS,F,1914-11-01,3351,NIELSENANGEL@YAHOO.COM +331,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-28,MAURICE RICHARD,M,1915-04-09,7519,LWALKER@YAHOO.COM +332,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-09-28,LAURA NOLAN,F,2000-12-05,4650,COOKBARRY@GMAIL.COM +333,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-09-28,PATRICK MURPHY,M,1931-02-13,8307,KROBINSON@HOTMAIL.COM +334,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-09-28,RANDY TYLER,M,1941-04-02,3172,LESLIE36@HOTMAIL.COM +335,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-29,KELSEY POWELL,F,2012-05-29,4618,RICHARDSTREVOR@HOTMAIL.COM +336,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-09-29,JOSE GARRISON,M,2007-10-05,7600,RANDY41@GMAIL.COM +337,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-29,JESSICA OLSON,F,2006-08-31,5343,SHARRIS@YAHOO.COM +338,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-29,GILBERT KELLY,M,1973-03-14,5306,MARISSAMORGAN@HOTMAIL.COM +339,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-09-29,MICHAEL REYES,M,1929-03-07,5463,ANGELAWONG@GMAIL.COM +340,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-29,ALISON EWING,F,1987-12-27,8316,SCHMIDTELIZABETH@HOTMAIL.COM +341,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-09-29,HELEN LE,F,1950-10-03,2622,CASEY14@HOTMAIL.COM +342,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-09-29,ALLISON HILL,F,1993-10-26,6727,JENNIFERMILES@HOTMAIL.COM +343,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-09-29,LISA KLEIN,F,1997-05-21,5380,LESLIENUNEZ@YAHOO.COM +344,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-29,AMANDA EDWARDS,F,2007-03-15,2105,DEVINMOORE@YAHOO.COM +345,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-09-29,MICHELLE JOHNSON,F,2021-07-09,5442,DANA37@HOTMAIL.COM +346,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-29,HEATHER BURNS,F,1955-10-26,3313,MICHAEL54@GMAIL.COM +347,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-09-29,RICHARD CHAVEZ,M,1912-07-02,5275,JAMESHARTMAN@YAHOO.COM +348,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-09-30,ROBERT WARD,M,1968-08-25,3263,NSCHMIDT@GMAIL.COM +349,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-09-30,KENNETH RODRIGUEZ,M,1991-10-06,3401,STEPHANIEBENJAMIN@GMAIL.COM +350,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-09-30,KIMBERLY CAMPBELL,F,1963-12-09,9405,SUSAN73@GMAIL.COM +351,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-09-30,SCOTT WONG,M,1919-05-11,6360,BWILLIAMS@HOTMAIL.COM +352,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-09-30,JESSICA GRIFFIN,F,2005-04-06,3714,MARTINEZBONNIE@GMAIL.COM +353,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-09-30,DIANE JIMENEZ,F,1924-07-25,9407,SJOHNSON@YAHOO.COM +354,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-01,NICHOLAS JOHNSON,M,1983-09-27,2216,NICHOLASSALAZAR@HOTMAIL.COM +355,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-10-01,MICHAEL HESTER,M,1907-10-13,2705,HEATHER31@HOTMAIL.COM +356,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-01,WILLIAM THOMAS,M,1979-02-27,3061,HOUSEALEX@GMAIL.COM +357,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-01,FRANK NUNEZ,M,1945-06-13,8316,RALPH78@GMAIL.COM +358,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-01,BRENDA MARTIN,F,1965-05-07,2156,GTHOMAS@HOTMAIL.COM +359,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-01,DAWN BAILEY,F,1998-09-29,3304,KYLEFARRELL@HOTMAIL.COM +360,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-01,MISS TINA GILLESPIE MD,F,1992-01-29,7105,XREEVES@HOTMAIL.COM +361,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-01,AMBER GLENN,F,1939-12-06,2745,CHRISTYADAMS@GMAIL.COM +362,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-01,WILLIAM OSBORN,M,1955-12-10,7600,MSCOTT@GMAIL.COM +363,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-02,MICHAEL THOMPSON,M,2012-03-25,5465,SUSANJAMES@YAHOO.COM +364,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-02,JAMES ROMERO,M,1936-04-17,1617,TRANALEXANDRA@GMAIL.COM +365,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-02,JOHN ADAMS,M,1940-10-17,8144,KTORRES@YAHOO.COM +366,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-02,BRITTANY HERNANDEZ,F,1939-07-21,7318,JLONG@HOTMAIL.COM +367,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-02,MR. 
BRIAN LAMBERT,M,1951-03-29,8144,TVELAZQUEZ@HOTMAIL.COM +368,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-02,CHRISTOPHER THOMPSON,M,2016-03-24,4616,DUNCANROBERT@HOTMAIL.COM +369,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-02,SABRINA THOMPSON,F,1987-05-19,2732,WATKINSCARLOS@YAHOO.COM +370,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-02,MATTHEW HUFF,M,1978-06-25,2617,OBURCH@HOTMAIL.COM +371,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-02,IAN MURPHY,M,1981-12-02,1854,FDAVIS@HOTMAIL.COM +372,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-02,MICHELLE PARKER,F,1972-10-30,2134,VICKIE13@YAHOO.COM +373,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-03,MISS RACHEL RICH,F,1917-03-28,7221,SHEILA33@YAHOO.COM +374,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-03,DENISE RAMIREZ,F,1961-03-30,6239,REBECCARAY@GMAIL.COM +375,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-03,ANDREW WILLIAMS,M,1999-03-02,5439,DEANBRUCE@YAHOO.COM +376,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-03,MARIA MILLER,F,1964-02-07,2843,ERICKSONJESSICA@GMAIL.COM +377,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-03,TOM FLETCHER,M,1961-01-16,7110,RODNEY68@YAHOO.COM +378,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-03,STEPHANIE WATKINS,F,1945-09-06,5427,BLAKEMICHAEL@YAHOO.COM +379,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-03,JASON JACKSON,M,2010-05-28,8122,WCAIN@GMAIL.COM +380,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-03,BREANNA WOLF,F,2017-01-01,5609,PATRICKGREGORY@YAHOO.COM +381,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-03,EDWARD BROWN,M,1926-09-17,2732,DOMINIC11@HOTMAIL.COM +382,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-03,JACOB HAWKINS,M,1949-10-28,2806,OSBORNESTEVEN@GMAIL.COM +383,UNIV. 
NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-03,KARA LONG,F,1968-03-27,3340,ADAMSCOLLEEN@HOTMAIL.COM +384,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-03,JAMES CLAY,M,1910-11-17,4719,MARYKELLY@GMAIL.COM +385,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-03,RYAN CAMPBELL,M,1910-03-25,7545,ROBERT79@HOTMAIL.COM +386,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-04,NICOLE OCONNOR,F,1993-12-18,5438,TONYA62@YAHOO.COM +387,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-04,JUSTIN CHEN,M,2010-03-16,5595,AJOHNSON@YAHOO.COM +388,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-04,DANIEL JORDAN,M,1969-01-19,2214,SHATFIELD@HOTMAIL.COM +389,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-04,CHRISTINA ARIAS,F,1993-03-07,3522,ZSUMMERS@GMAIL.COM +390,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-04,BRITTANY MARTIN,F,1943-12-02,2900,HENRYAMBER@HOTMAIL.COM +391,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-04,EMILY AYALA,F,1918-12-11,6438,PORTERSUSAN@GMAIL.COM +392,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-04,MR. PHILIP SALINAS,M,1948-08-30,6009,TMARQUEZ@HOTMAIL.COM +393,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-05,GABRIELA MCGRATH,F,1971-10-13,2253,ALEXISANDERSON@HOTMAIL.COM +394,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-05,CATHY LONG,F,1994-09-10,3317,NDAVIS@GMAIL.COM +395,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-05,WILLIE BRADLEY,M,1907-09-29,3254,ZGILL@HOTMAIL.COM +396,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-05,MARY WALLACE,F,1992-09-26,3401,COXMARY@HOTMAIL.COM +397,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-05,JESSICA FRANCIS,F,2001-09-09,7517,MELISSA16@GMAIL.COM +398,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-05,ANTHONY COMPTON,M,1967-09-14,6555,NATALIECRAWFORD@YAHOO.COM +399,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-05,CASEY LEWIS,M,1938-08-24,3445,JOHNSONCHRISTIAN@YAHOO.COM +400,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-05,JEREMY MORRIS,M,1930-12-25,1603,MISTY51@HOTMAIL.COM +401,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-05,MISTY COLON,F,2015-08-07,5563,KCAMPBELL@GMAIL.COM +402,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-05,KYLE SMITH,M,1964-05-23,5634,KYLEMARTIN@GMAIL.COM +403,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-05,JASMINE SALAZAR,F,2019-09-13,3425,CAMERONSTEPHANIE@GMAIL.COM +404,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-05,RACHEL VELEZ,F,1970-05-04,8349,POWELLCHRISTOPHER@HOTMAIL.COM +405,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-05,ANITA FERNANDEZ,F,2014-07-22,2943,JONESKRISTEN@GMAIL.COM +406,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-05,TYLER ROSS,M,1983-10-28,3261,TANNERYOLANDA@HOTMAIL.COM +407,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-05,NANCY MCPHERSON MD,F,1914-09-02,4648,JOELSNYDER@HOTMAIL.COM +408,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-05,ERIN HARTMAN,F,1923-11-18,1718,NEWTONMARGARET@HOTMAIL.COM +409,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-05,SARAH JOHNSON,F,1934-06-29,6437,DAVIDWILLIAMS@YAHOO.COM +410,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-06,MICHAEL PATEL,M,1929-02-05,9220,EMILY48@HOTMAIL.COM +411,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-06,BARBARA LEE,F,1980-11-26,3518,STOKESDEVON@YAHOO.COM +412,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-06,CHRISTINE STRICKLAND,F,1997-08-21,5590,REBECCAPHILLIPS@HOTMAIL.COM +413,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-06,ROGER RAMIREZ,M,2019-01-08,1826,ALEXANDERROBINSON@YAHOO.COM +414,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-06,JEFFREY CURTIS,M,1937-10-13,7601,MHENDRICKS@YAHOO.COM +415,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-06,JUSTIN HOPKINS,M,1912-01-13,6439,CHANCHRISTINA@HOTMAIL.COM +416,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-10-06,MARCUS HALL,M,1948-04-10,5303,DAVID12@GMAIL.COM +417,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-06,TIFFANY GILBERT,F,1946-03-08,2725,YINGRAM@YAHOO.COM +418,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-06,BRIAN SMITH,M,1921-12-28,4231,YHENDERSON@HOTMAIL.COM +419,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-06,JEFF GONZALES,M,1918-12-10,8322,ROBERT54@GMAIL.COM +420,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-06,KIMBERLY BLAIR,F,1940-05-04,2914,ROBERTBRAUN@GMAIL.COM +421,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-06,TERRY COX,M,1919-11-22,5719,GALVANCYNTHIA@HOTMAIL.COM +422,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-06,BRIAN HUBER,M,2006-03-04,1739,MWARREN@YAHOO.COM +423,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-06,APRIL RODRIGUEZ,F,1925-03-30,1640,YLEE@YAHOO.COM +424,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-10-06,RAYMOND COLEMAN,M,1943-06-12,6337,JEFFERY22@YAHOO.COM +425,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-06,THOMAS THOMAS,M,1927-09-15,5505,CARRIE51@YAHOO.COM +426,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-06,TYLER MORALES,M,1983-08-08,6667,MICHAELHOGAN@GMAIL.COM +427,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-07,TIMOTHY KELLER,M,1943-08-25,5605,MMCCALL@HOTMAIL.COM +428,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-07,JAKE BROWN,M,1955-08-28,3204,HAYESBENJAMIN@YAHOO.COM +429,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-07,MICHAEL COLEMAN,M,1923-06-02,1879,TONI31@GMAIL.COM +430,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-07,KENNETH GARCIA,M,1990-09-08,5361,CRAWFORDANGELA@YAHOO.COM +431,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-07,LUIS MUELLER,M,1921-03-28,5500,JAMESSANDERS@YAHOO.COM +432,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-07,CHRISTINE WATSON,F,1932-10-11,3117,CHARLESTRAN@YAHOO.COM +433,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-07,LISA SAUNDERS,F,1948-04-13,4195,YWILLIAMS@HOTMAIL.COM +434,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-07,JUAN HOWARD,M,2003-08-27,8300,PTAYLOR@YAHOO.COM +435,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-07,ROBERT JONES,M,1981-07-26,2745,GLORIASALINAS@GMAIL.COM +436,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-07,MELANIE MAXWELL,F,1976-02-12,8503,FRAZIERKARA@GMAIL.COM +437,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-07,ANNE MARQUEZ,F,1922-09-16,4743,TIFFANY19@GMAIL.COM +438,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-07,VICTORIA FORD,F,1931-11-17,6058,DANAGOODWIN@HOTMAIL.COM +439,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-07,PAUL DANIELS,M,2021-03-19,1763,CARTERCASEY@GMAIL.COM +440,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-07,TERRANCE MARTIN,M,1975-03-24,8415,WATKINSCLAIRE@HOTMAIL.COM +441,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-07,CAROL SHAW,F,1916-10-03,9101,LINDSEY45@GMAIL.COM +442,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-10-07,CAROLYN BAKER,F,1952-02-01,4653,QINGRAM@HOTMAIL.COM +443,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-07,MR. ROBERT GARCIA MD,M,1991-03-30,2600,JAMESSMITH@HOTMAIL.COM +444,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-07,JESSICA HANCOCK,F,1950-01-22,6614,SANCHEZCARL@HOTMAIL.COM +445,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-08,MARY GONZALEZ,F,1963-03-04,6063,SUSANJONES@YAHOO.COM +446,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-08,THOMAS FERGUSON,M,1963-05-28,3133,RRAMOS@GMAIL.COM +447,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-08,MR. JOSHUA HERNANDEZ MD,M,1992-09-05,3183,JESSICADAVIS@YAHOO.COM +448,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-08,KATIE WASHINGTON,F,1962-02-07,6341,LINDA72@YAHOO.COM +449,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-08,MATTHEW FOX,M,2011-06-12,5612,ALYSSARODRIGUEZ@YAHOO.COM +450,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-08,JASMINE RODRIGUEZ,F,2016-03-05,4632,LPRATT@YAHOO.COM +451,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-08,JACOB COPELAND,M,1965-01-27,2500,GREGORYDOUGHERTY@GMAIL.COM +452,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-08,JULIE GARCIA,F,1963-12-07,5577,DANIEL38@HOTMAIL.COM +453,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-08,WILLIAM THOMAS,M,1935-02-20,4159,OROBINSON@YAHOO.COM +454,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-08,AUSTIN SAUNDERS,M,1910-07-26,6450,CRUZMICHAEL@GMAIL.COM +455,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-08,DAVID FERGUSON,M,1917-09-19,2187,SGILBERT@GMAIL.COM +456,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-08,GLORIA SMITH,F,1943-03-30,2846,JMILLER@YAHOO.COM +457,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-09,MICHAEL OLIVER,M,1916-10-09,6621,THOMASSTEPHANIE@GMAIL.COM +458,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-09,KATHRYN VALDEZ,F,1925-04-17,2743,TINAWOLF@HOTMAIL.COM +459,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-09,BELINDA WILLIS,F,1985-03-29,6701,GOLDENRYAN@HOTMAIL.COM +460,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-09,JASON HAYNES,M,2021-06-16,2208,MULLINSSEAN@GMAIL.COM +461,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-09,ALEXANDRIA BLACK,F,1935-01-07,5265,BILLY87@YAHOO.COM +462,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-09,IAN MORRIS,M,1906-04-27,1895,YGONZALES@GMAIL.COM +463,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-09,GLEN REILLY,M,1990-04-27,6214,VFERNANDEZ@YAHOO.COM +464,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-09,DAVID DUDLEY,M,1956-12-26,5333,YOUNGDAVID@HOTMAIL.COM +465,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-10,TRACY JOHNSON,F,1934-10-12,4709,MICHAEL34@GMAIL.COM +466,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-10,MATTHEW VAUGHN,M,1973-12-14,3080,MSANCHEZ@YAHOO.COM +467,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-10-10,CRYSTAL RAY,F,1906-02-17,7404,SHORTANGELA@YAHOO.COM +468,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-10,VICTORIA HOWE,F,1948-02-20,2115,MARGARETSMITH@HOTMAIL.COM +469,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-10,JAY HOLLAND,M,1975-05-21,7623,DUSTIN47@GMAIL.COM +470,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-10,ALLISON MCLAUGHLIN,F,2007-02-06,3587,YODERMARIA@GMAIL.COM +471,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-10,AARON LYONS,M,1938-06-19,2600,MHUTCHINSON@YAHOO.COM +472,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-10,BRANDI MAHONEY,F,1943-08-17,1676,MARK87@GMAIL.COM +473,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-10,KRISTINA WELCH,F,2013-06-12,7011,BROWNLAWRENCE@HOTMAIL.COM +474,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-10,AMY BONILLA,F,1910-10-17,2347,ERIKA40@GMAIL.COM +475,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-10,JASON WILSON,M,1987-10-28,9033,HEATHERGAMBLE@YAHOO.COM +476,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-11,CODY HUNT MD,M,1967-01-15,3214,KEITH37@HOTMAIL.COM +477,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-11,ANTHONY FERNANDEZ,M,1958-09-24,3463,GREGORYHOFFMAN@YAHOO.COM +478,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-11,DR. DUANE CAMPBELL MD,M,2021-03-20,1647,JAMESMOORE@YAHOO.COM +479,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-11,JAMES GATES,M,1943-12-07,5265,CHRISTOPHER21@GMAIL.COM +480,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-11,WESLEY HARRIS,M,1995-07-18,5545,DOUGLASMARTIN@GMAIL.COM +481,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-11,DEREK WADE,M,1948-01-27,2821,TIFFANYPEREZ@GMAIL.COM +482,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-10-11,DESTINY GARCIA,F,1994-11-27,5460,BRANDTDAVID@YAHOO.COM +483,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-12,CHELSEA FLETCHER,F,1997-04-14,2764,KMORENO@HOTMAIL.COM +484,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-12,CHASE HICKS,M,1930-07-07,7607,AMBER24@HOTMAIL.COM +485,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-12,RACHEL MILLS,F,1972-07-03,1980,ANDREW99@YAHOO.COM +486,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-12,JEREMY JOHNSON,M,1941-02-21,2340,SCOTTBAXTER@GMAIL.COM +487,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-12,APRIL THOMAS,F,1916-01-17,6337,ERIN38@YAHOO.COM +488,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-10-12,ROBERTA WHEELER,F,1996-01-24,4709,ELIZABETHNICHOLS@YAHOO.COM +489,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-12,CAROLINE THOMPSON,F,1915-09-08,2854,SOLISAMY@YAHOO.COM +490,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-12,OSCAR MILLER,M,2013-07-13,8175,PMANN@HOTMAIL.COM +491,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-12,JASON LEWIS,M,1965-03-29,9050,TMCMAHON@GMAIL.COM +492,UNIV. 
NACIONAL DEL COMAHUE,FARMACIA,2020-10-12,ALAN MARTINEZ,M,1928-03-09,1718,BROWNJUSTIN@YAHOO.COM +493,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-12,ERIN NICHOLS,F,1983-11-10,9207,SEAN31@GMAIL.COM +494,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-12,JULIE DECKER,F,1978-10-27,3194,ROBERTGOODWIN@GMAIL.COM +495,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-12,CARLA WAGNER,F,1935-11-27,2109,SHEENA43@GMAIL.COM +496,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-10-13,CINDY ADAMS,F,1982-05-15,2505,LEWISDUANE@YAHOO.COM +497,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-13,KIMBERLY POOLE,F,1914-10-02,5601,UOCONNOR@HOTMAIL.COM +498,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-13,ANN SMITH,F,1947-03-11,3023,WRIGHTWILLIAM@HOTMAIL.COM +499,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-13,LISA COLLIER,F,1926-05-28,6634,CASESTACEY@YAHOO.COM +500,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-13,CATHERINE GARCIA,F,1966-09-28,7167,YGARCIA@GMAIL.COM +501,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-13,JASON WHITE,M,1915-01-11,7201,BIRDSARA@HOTMAIL.COM +502,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-13,JUAN SANCHEZ,M,1967-08-10,1617,AIMEE12@YAHOO.COM +503,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-13,KYLE MATA,M,1997-11-05,5609,GARCIASEAN@HOTMAIL.COM +504,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-13,JESSICA GRAVES,F,1921-03-09,6651,RODRIGUEZWILLIAM@GMAIL.COM +505,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-13,ERIC WILSON,M,1935-06-09,3541,JEFFREYMONTGOMERY@HOTMAIL.COM +506,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-13,SANDRA JONES,F,1972-11-08,3316,MORRISMICHAEL@GMAIL.COM +507,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-13,BRANDON JONES,M,2018-08-27,2845,MJACKSON@GMAIL.COM +508,UNIV. 
NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-13,TERRY RODRIGUEZ,M,2007-08-15,6007,LISAJOHNSTON@YAHOO.COM +509,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-13,SUSAN WOLF,F,1930-04-30,5615,CROSS@YAHOO.COM +510,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-13,JEFFREY CAMPBELL,M,1957-09-12,3337,PAULCARROLL@GMAIL.COM +511,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-14,PAULA SCOTT,F,1965-11-28,2173,NICHOLAS30@GMAIL.COM +512,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-14,MISTY MURPHY,F,1906-09-24,9411,BRADLEYALEXANDER@GMAIL.COM +513,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-14,DIANE BLACK,F,1967-02-04,4231,WILLIAMRICE@HOTMAIL.COM +514,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-14,BRIANNA WILLIAMS,F,1981-11-25,4601,DAVIDMILLER@GMAIL.COM +515,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-14,MARISSA MARTINEZ,F,1928-05-10,1885,LISANEAL@HOTMAIL.COM +516,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-14,JONATHON WILSON,M,1980-10-13,3501,KKENNEDY@YAHOO.COM +517,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-14,STEVE BENDER,M,1964-03-14,4235,LROGERS@GMAIL.COM +518,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-14,BARBARA SPEARS,F,1971-02-25,6433,CINDY96@HOTMAIL.COM +519,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-14,CONNIE DUNCAN,F,1985-08-06,5584,PPARSONS@YAHOO.COM +520,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-14,MELISSA BROWNING,F,2019-03-20,2709,MICHELLE02@HOTMAIL.COM +521,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-15,NICOLE WILLIAMS,F,1968-12-23,5735,PAMELASOTO@HOTMAIL.COM +522,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-15,NATALIE SCHAEFER,F,2019-08-07,1776,GRACE96@HOTMAIL.COM +523,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-15,ALYSSA LAM,F,1907-06-23,5881,ANTONIO84@YAHOO.COM +524,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-15,ELIZABETH HARRIS,F,1966-09-05,1847,MCARR@YAHOO.COM +525,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-15,MATTHEW BARTON DDS,M,1937-10-30,5587,RYANHARPER@GMAIL.COM +526,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-15,CHRISTOPHER LEE,M,1910-10-28,8174,FARMERJOHNNY@YAHOO.COM +527,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-15,JULIE WARREN,F,1948-04-29,9050,ALEJANDRO81@GMAIL.COM +528,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-15,STACEY GARCIA,F,1953-08-10,3220,JANE46@HOTMAIL.COM +529,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-15,RICHARD FIELDS,M,1970-12-26,7607,OROZCOJOHN@HOTMAIL.COM +530,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-15,DUSTIN FREY,M,1920-07-05,3269,DANIELLEHARMON@HOTMAIL.COM +531,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-15,WENDY REYES,F,2004-11-05,6058,KELLYBRITTANY@GMAIL.COM +532,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-16,COURTNEY PACE,F,1926-09-24,8101,JELLIS@HOTMAIL.COM +533,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-16,FREDERICK FLETCHER,M,2003-03-26,7220,MATTHEW01@GMAIL.COM +534,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-16,TRACY WEEKS DDS,F,2003-02-23,1676,ROBERTROCHA@GMAIL.COM +535,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-16,MARK POWELL,M,1956-04-02,4122,KIRSTEN42@GMAIL.COM +536,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-16,DAVID FORD,M,1980-08-31,3371,ANGELAMORA@HOTMAIL.COM +537,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-16,JOHN WILSON,M,2013-09-12,3052,JOHN88@YAHOO.COM +538,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-16,NICHOLAS HARRIS,M,2012-09-04,8403,SPENCERJOSE@YAHOO.COM +539,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-16,KATHY ROJAS,F,1953-09-14,4146,PLUNA@HOTMAIL.COM +540,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-16,TREVOR FRANKLIN,M,2015-02-13,7263,DANIELHINES@YAHOO.COM +541,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-16,JOANNE LEWIS,F,2012-06-20,4606,VCARNEY@GMAIL.COM +542,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-16,MR. JEREMY PETERSEN,M,1954-03-02,5276,TAMMY85@HOTMAIL.COM +543,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-17,DORIS DAVIS,F,1968-09-18,3532,DANIELLEJOHNSON@YAHOO.COM +544,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-17,ANDREW SMITH,M,1965-11-02,3136,KCOLEMAN@YAHOO.COM +545,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-17,MELISSA YOUNG,F,1946-10-29,6616,REBECCA05@HOTMAIL.COM +546,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-17,JOE HORNE MD,M,1985-04-25,1682,ROBERTBENNETT@YAHOO.COM +547,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-17,SUSAN MALDONADO,F,2000-11-07,5400,ASHLEY87@HOTMAIL.COM +548,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-17,COURTNEY BRENNAN,F,1977-09-25,3199,ROSESHARP@GMAIL.COM +549,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-17,ANTHONY THOMPSON,M,2011-03-09,6530,NICHOLASGILL@HOTMAIL.COM +550,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-17,MARTHA JOHNSON,F,1959-01-01,3366,LUIS60@GMAIL.COM +551,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-17,APRIL ROTH,F,1928-04-30,6411,SUSAN58@YAHOO.COM +552,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-17,NICHOLE REYES,F,2014-10-25,6311,BETHANYSTANLEY@GMAIL.COM +553,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-17,JONATHAN BAIRD,M,1925-09-13,3066,GLORIAARROYO@YAHOO.COM +554,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-17,CAROL NELSON,F,1952-02-05,3332,BRANDTJASON@YAHOO.COM +555,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-17,TRACY WELLS,F,1982-06-13,8203,THOMPSONBRADLEY@YAHOO.COM +556,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-17,JOHN JOHNSON,M,1915-04-05,7265,HOWEHEATHER@HOTMAIL.COM +557,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-17,DEREK WARREN,M,2008-09-06,3531,UMOORE@HOTMAIL.COM +558,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-18,NICOLE WHITAKER,F,1920-01-17,7112,KCARTER@YAHOO.COM +559,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-18,KAREN KING,F,2009-04-05,6018,SARAH48@GMAIL.COM +560,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-18,CHRISTOPHER MARTINEZ,M,1923-04-08,6513,MICHAEL37@HOTMAIL.COM +561,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-18,HEATHER TERRELL,F,1978-12-13,6239,XREED@YAHOO.COM +562,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-18,RICKY GARCIA,M,1984-05-28,6070,DBALL@YAHOO.COM +563,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-18,MS. HEATHER MARTINEZ,F,2014-06-30,8336,BGARCIA@GMAIL.COM +564,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-18,SAMANTHA BERNARD,F,1983-05-03,1815,HEATHERLEE@YAHOO.COM +565,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-18,HECTOR REYES,M,1959-12-02,5591,RMARTINEZ@GMAIL.COM +566,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-18,TIMOTHY GIBSON,M,2013-07-20,6050,CHRISTOPHEREVANS@GMAIL.COM +567,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-18,ALLEN RAMIREZ,M,1946-04-04,4168,SULLIVANRYAN@GMAIL.COM +568,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-18,JOSEPH MATA,M,1967-03-06,6305,ZBARTLETT@HOTMAIL.COM +569,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-18,SARAH SHAFFER,F,2010-11-18,1636,MELANIE86@GMAIL.COM +570,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-18,JOHN LEE,M,1918-08-23,4147,SAUNDERSAMY@YAHOO.COM +571,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-19,JULIA SMITH,F,1960-09-22,2806,JAMES31@HOTMAIL.COM +572,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-19,ANGELA MULLINS,F,1973-09-12,2103,KENTJILL@GMAIL.COM +573,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-19,PETER SPENCER,M,2014-07-24,6001,DONNAVALDEZ@HOTMAIL.COM +574,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-19,STEPHANIE BENJAMIN,F,1994-05-21,1744,AGOODMAN@YAHOO.COM +575,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-19,MATTHEW HUGHES,M,1969-09-13,6665,MCGUIRELAURA@YAHOO.COM +576,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-19,SONIA SANDERS,F,1922-04-27,7408,CHRISTOPHER59@HOTMAIL.COM +577,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-19,MR. THOMAS DEAN MD,M,1926-12-08,1774,FSMITH@YAHOO.COM +578,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-19,STEPHEN GONZALEZ,M,1999-10-30,5636,QMORA@GMAIL.COM +579,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-19,MICHAEL LUNA,M,1999-10-27,8117,JAMES83@HOTMAIL.COM +580,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-19,TIMOTHY WOOD,M,1954-01-17,4101,MALDONADOMICHAEL@YAHOO.COM +581,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-19,CHARLES TAYLOR,M,1957-03-24,4242,RENEE64@HOTMAIL.COM +582,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-19,CASSANDRA SERRANO,F,1993-09-26,8000,AARONLOVE@HOTMAIL.COM +583,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-20,CHRISTOPHER NORMAN,M,1959-09-20,3326,MILLERTIMOTHY@YAHOO.COM +584,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-20,BRENDA GAMBLE,F,2001-01-24,4134,ANGEL72@GMAIL.COM +585,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-20,PHILIP WANG,M,1914-03-23,8416,LIUKATHRYN@YAHOO.COM +586,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-20,AUTUMN MCGEE,F,1931-11-20,8133,FDOYLE@HOTMAIL.COM +587,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-20,DANIEL GLENN,M,1988-03-18,3586,PJOHNSON@HOTMAIL.COM +588,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-20,BENJAMIN LOPEZ,M,1964-01-27,1686,JOHNSONREBECCA@GMAIL.COM +589,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-20,KAITLYN STRONG,F,2018-10-18,4147,TNICHOLS@YAHOO.COM +590,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-20,JOEL DORSEY,M,1933-04-19,5595,CHRISTOPHER37@GMAIL.COM +591,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-20,THERESA SCOTT,F,2021-05-22,1872,MIRANDALARSON@YAHOO.COM +592,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-20,COLLEEN RODRIGUEZ,F,2007-11-15,6070,WADECHERYL@GMAIL.COM +593,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-20,CHRISTINA NELSON,F,1980-02-19,8134,FBENNETT@GMAIL.COM +594,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-20,BRYAN COPELAND,M,1963-08-02,6605,JSNYDER@GMAIL.COM +595,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-20,MELINDA WALTER,F,1953-07-29,8111,BUSHBRETT@YAHOO.COM +596,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-21,JOSE NAVARRO,M,1987-02-21,4633,FWEAVER@HOTMAIL.COM +597,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-21,TAMMY GIBSON,F,1944-04-17,6417,JOHN91@HOTMAIL.COM +598,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-21,KEVIN PEREZ,M,1996-09-23,4137,RASMUSSENLUIS@YAHOO.COM +599,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-21,JOSHUA PATTERSON,M,1974-12-07,7208,BAILEYROSE@YAHOO.COM +600,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-21,KAYLA HALL,F,1986-09-27,4705,JACK59@HOTMAIL.COM +601,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-21,MICHAEL CHASE,M,2000-10-20,6075,MILLERAARON@YAHOO.COM +602,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-21,MICHELE MOONEY,F,1932-01-27,3586,MICHAELLEON@GMAIL.COM +603,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-21,SIERRA KAISER,F,1940-05-08,2508,SARAH66@YAHOO.COM +604,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-21,MARY PEREZ,F,1929-04-13,2745,MZIMMERMAN@GMAIL.COM +605,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-21,ROBERT MENDOZA,M,1917-03-29,8373,CASTANEDADALTON@YAHOO.COM +606,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-21,KELLY BAUER,F,2007-07-17,3265,CCOLEMAN@HOTMAIL.COM +607,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-21,JACQUELINE INGRAM,F,1940-07-06,5529,JOSEPH84@HOTMAIL.COM +608,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-22,AMANDA WILLIAMS,F,1957-09-18,1735,EADAMS@YAHOO.COM +609,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-10-22,CHRISTOPHER PALMER,M,2015-11-29,1911,SARAH42@GMAIL.COM +610,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-22,NATALIE LOWE,F,1920-10-05,6277,ANN54@GMAIL.COM +611,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-22,BENJAMIN LEE,M,1943-06-18,8172,ECOX@HOTMAIL.COM +612,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-22,EMILY BAKER,F,1944-09-06,5365,ROBERT98@YAHOO.COM +613,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-22,SPENCER CHRISTIAN,M,1990-01-28,2743,STEVEN06@HOTMAIL.COM +614,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-22,JASON MAYS,M,1912-12-18,2204,MCNEILDANIEL@HOTMAIL.COM +615,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-22,DEBORAH WOODS,F,2007-03-26,2705,LITTLESHANNON@YAHOO.COM +616,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-22,JACKIE GARRETT,F,1947-08-30,3056,ASHLEY35@YAHOO.COM +617,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-22,MR. MIKE JOHNSON,M,1987-05-21,3337,COLEJAMIE@YAHOO.COM +618,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-22,VANESSA WALTON,F,2009-05-24,9310,KHOLLOWAY@GMAIL.COM +619,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-22,VICTORIA DIXON,F,2000-08-08,7517,JOHN81@YAHOO.COM +620,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-10-22,ALEXIS THOMPSON,F,1954-10-13,2200,KENGLISH@GMAIL.COM +621,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-23,GABRIEL DAWSON,M,1981-08-05,7212,RICHARDWILLIAMS@GMAIL.COM +622,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-23,PARKER SHAW,M,2011-08-10,6652,JOHNSONPATRICIA@HOTMAIL.COM +623,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-23,SEAN ZIMMERMAN,M,1983-09-23,4184,CYNTHIA55@HOTMAIL.COM +624,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-23,JUSTIN MCMILLAN,M,1993-01-19,4242,NJIMENEZ@HOTMAIL.COM +625,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-23,MATTHEW STEPHENSON,M,2020-09-05,3020,TANNER43@YAHOO.COM +626,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-23,JEREMY BLACKBURN,M,2003-06-15,5303,BLAKE46@GMAIL.COM +627,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-23,RAYMOND MORRIS,M,1973-07-10,7637,DAVISKARI@YAHOO.COM +628,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-23,LAURA GIBSON,F,1938-12-03,3087,CARMENMCKINNEY@YAHOO.COM +629,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-23,DEBRA SCOTT,F,1958-04-29,6389,HSAMPSON@GMAIL.COM +630,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-23,DR. LAWRENCE STANLEY DDS,M,1965-01-12,7531,RYAN81@YAHOO.COM +631,UNIV. 
NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-23,PATRICK GRAY,M,2017-09-05,2403,REBEKAH02@GMAIL.COM +632,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-23,DAVID SINGH,M,1934-11-18,3516,FBAKER@HOTMAIL.COM +633,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-10-23,DAVID ERICKSON,M,2012-01-08,2814,CASEYBURGESS@YAHOO.COM +634,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-24,CYNTHIA RODGERS,F,1974-10-14,3386,JOHNSONJASON@YAHOO.COM +635,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-24,KENDRA ADAMS,F,1914-12-05,2713,NATHANIEL92@YAHOO.COM +636,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-24,RYAN FITZGERALD,M,2010-06-25,5357,FOWLERMORGAN@YAHOO.COM +637,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-24,MR. TROY MEJIA,M,1958-04-02,2144,COFFEYLATOYA@GMAIL.COM +638,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-24,JAMES ANDERSON,M,1995-10-15,5600,HRIVERA@YAHOO.COM +639,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-24,CHRISTINE BLACKBURN,F,1908-01-04,4504,ZJENNINGS@YAHOO.COM +640,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-24,BRETT CASTILLO,M,2000-06-21,6551,MOLLYBAKER@YAHOO.COM +641,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-10-24,SPENCER CAMPBELL,M,1959-03-02,5596,APRIL21@YAHOO.COM +642,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-24,JUSTIN SALINAS,M,1917-03-31,3005,PATRICIA51@HOTMAIL.COM +643,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-10-24,SARAH WILLIAMS,F,2012-01-22,2728,WILLIAMREED@GMAIL.COM +644,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-10-24,PATTY PEREZ,F,1911-11-21,1895,MMOORE@GMAIL.COM +645,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-25,KEVIN DRAKE,M,1925-07-19,3543,OROBINSON@HOTMAIL.COM +646,UNIV. 
NACIONAL DEL COMAHUE,MEDICINA,2020-10-25,BRETT FERGUSON,M,1994-02-22,3300,MMCKENZIE@GMAIL.COM +647,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-25,SARAH LOWE,F,1949-11-12,1886,JAMESTHOMPSON@GMAIL.COM +648,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-25,MICHAEL ORTIZ,M,1939-05-15,3448,WBOWMAN@HOTMAIL.COM +649,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-25,SHANNON WEBER,F,1973-11-20,2635,ASHLEYMCGEE@YAHOO.COM +650,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-25,JAMES LEBLANC,M,2013-11-11,6476,CARROLLSTEPHEN@YAHOO.COM +651,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-25,CHRISTINE BRADFORD,F,1967-08-19,2111,LOGANPATRICK@YAHOO.COM +652,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-25,MARY WATERS,F,1953-05-20,8322,BDOMINGUEZ@YAHOO.COM +653,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-25,PAUL PETTY,M,1945-05-16,5405,CARRILLOHENRY@HOTMAIL.COM +654,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-25,SCOTT SHARP,M,2010-05-04,4133,MORGANWHITNEY@YAHOO.COM +655,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-25,MEGAN WILSON,F,1907-02-09,7513,WOODSTEPHANIE@YAHOO.COM +656,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-25,ALLISON MILLER,F,1976-08-13,8181,AALVAREZ@GMAIL.COM +657,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-25,ANDREA HARDIN,F,1932-09-26,5637,DBROWN@YAHOO.COM +658,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-25,DENISE GRAY,F,1918-07-23,2754,REEDJONATHAN@GMAIL.COM +659,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-10-25,VERONICA TORRES,F,1917-01-19,9200,JOHN69@GMAIL.COM +660,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-25,ETHAN HOPKINS,M,1927-12-31,3009,BRADSHAWSHANNON@YAHOO.COM +661,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-25,JOSEPH JOHNSON,M,1984-03-11,3137,DANIELREYNOLDS@HOTMAIL.COM +662,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-25,MOLLY CLARK,F,1916-02-20,8126,CHRISTOPHER24@YAHOO.COM +663,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-25,MELVIN ANTHONY,M,1921-07-12,7240,KEYANNA@HOTMAIL.COM +664,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-25,NICOLE JONES,F,1966-01-07,8204,DEANMICHELLE@YAHOO.COM +665,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-10-26,MICHELE BECK,F,1938-02-01,6608,VERONICABAKER@GMAIL.COM +666,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-26,DR. MEREDITH FISHER,F,1939-02-03,9111,LGRIFFITH@HOTMAIL.COM +667,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-26,LINDA BRADLEY,F,1956-07-07,3400,KATHLEENMILLER@HOTMAIL.COM +668,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-26,SELENA MAYS,F,1957-02-10,6105,ZJAMES@GMAIL.COM +669,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-10-26,JASON KING MD,M,2010-12-25,2445,ADAM27@HOTMAIL.COM +670,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-10-26,DEBRA TODD,F,1930-01-11,6509,GREGORYBECK@HOTMAIL.COM +671,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-26,LISA THOMPSON,F,2008-07-14,4135,FIGUEROAERICA@YAHOO.COM +672,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-26,COLTON BARRETT,M,1926-09-15,5431,ZHUDSON@YAHOO.COM +673,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-10-26,MEGAN PALMER,F,2000-07-28,8200,JOSEPHROBINSON@HOTMAIL.COM +674,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-26,ELLEN JACOBS,F,1973-03-03,3581,PEGGY98@YAHOO.COM +675,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-10-26,DIANE JONES,F,1931-05-21,3162,CARLBLACK@HOTMAIL.COM +676,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-26,DEREK JONES,M,1997-07-21,5517,EMILYMCCULLOUGH@HOTMAIL.COM +677,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-27,KIMBERLY GUZMAN,F,1984-04-04,6346,VMCKNIGHT@HOTMAIL.COM +678,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-27,LAURA HARRIS,F,1970-07-16,5275,WOODLARRY@GMAIL.COM +679,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-27,COREY RHODES,M,1988-07-28,6051,LOPEZSUSAN@GMAIL.COM +680,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-27,ROBERT CAMERON,M,1966-06-11,2156,DENISEELLIOTT@GMAIL.COM +681,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-10-27,MR. ROBERT BAILEY,M,1922-02-07,5300,YMITCHELL@GMAIL.COM +682,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-10-27,DANIEL RODGERS,M,1963-08-13,6065,CHENSON@HOTMAIL.COM +683,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-27,DONALD HARRELL,M,1978-12-26,8353,MOORECARLOS@YAHOO.COM +684,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-27,REBECCA BASS,F,1987-07-15,2722,MELISSASMITH@HOTMAIL.COM +685,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-10-27,JOHN ARMSTRONG,M,1980-08-24,2400,JENNIFER88@GMAIL.COM +686,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-27,CHARLES YORK,M,1916-12-15,3009,MICHELLEWOODS@HOTMAIL.COM +687,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-10-28,VICTORIA BRADLEY,F,2011-08-17,1834,AMBERSMITH@HOTMAIL.COM +688,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-10-28,JESSICA COX,F,1911-04-18,2930,FRANKDAVID@HOTMAIL.COM +689,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-28,SUSAN AYERS,F,1907-10-01,3378,ZMARKS@HOTMAIL.COM +690,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-28,MICHAEL PALMER,M,2003-04-15,3374,ANNEFLORES@GMAIL.COM +691,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-28,DAVID DIAZ,M,1999-09-27,3170,RHONDA46@YAHOO.COM +692,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-28,ANGELICA GOMEZ,F,2005-06-28,7150,MARY97@YAHOO.COM +693,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-28,SYDNEY JONES,F,1983-05-27,4146,AUTUMN85@YAHOO.COM +694,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-28,TIMOTHY ROGERS,M,1945-07-14,3187,CCUNNINGHAM@YAHOO.COM +695,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-10-28,WILLIAM MCBRIDE,M,2010-10-15,2720,SHEPARDCALEB@YAHOO.COM +696,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-28,MICHELE GILBERT,F,1946-09-12,2635,VLOGAN@HOTMAIL.COM +697,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-29,PHILIP NGUYEN,M,1968-05-08,3470,CHRISTINE03@YAHOO.COM +698,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-29,RACHEL GONZALEZ,F,1961-03-02,3133,DANIEL74@GMAIL.COM +699,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-10-29,DOUGLAS CASTRO,M,1924-03-28,6605,OMURPHY@YAHOO.COM +700,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-29,MARCUS EVANS,M,1911-11-06,5609,CAMPOSTIFFANY@HOTMAIL.COM +701,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-29,LAURA FREY,F,1967-09-02,6607,SCOTT46@HOTMAIL.COM +702,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-10-29,PHILLIP SMITH,M,1951-07-26,1778,KJONES@YAHOO.COM +703,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-29,GERALD MILLER,M,1990-12-15,6315,JACOBSTHOMAS@GMAIL.COM +704,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-29,JAMES TORRES,M,1982-05-14,9019,VJARVIS@YAHOO.COM +705,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-29,JUSTIN ADAMS,M,1931-03-25,3526,TODD55@YAHOO.COM +706,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-29,CHRISTOPHER GAINES,M,1954-12-15,2740,BRITTANYMONTGOMERY@GMAIL.COM +707,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-29,PETER RAMOS,M,2020-01-18,7517,XORTEGA@HOTMAIL.COM +708,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-10-29,AARON SIMS,M,1984-04-19,5276,MSMITH@GMAIL.COM +709,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-10-29,DAN PEREZ,M,1935-07-24,7000,JESSICAVASQUEZ@YAHOO.COM +710,UNIV. 
NACIONAL DEL COMAHUE,FARMACIA,2020-10-29,CHLOE LAMBERT,F,2018-10-21,5421,KATHERINE72@GMAIL.COM +711,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-10-29,BETH GRAY,F,1951-03-11,3113,SONYA51@YAHOO.COM +712,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-10-30,DARLENE BAXTER,F,1934-08-11,4139,ROBERTCLARK@YAHOO.COM +713,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-30,DAWN ANDERSON,F,1969-03-17,6605,PEREZMICHAEL@HOTMAIL.COM +714,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-10-30,GINA RUIZ,F,1938-08-24,5591,ANDERSONDANIELLE@GMAIL.COM +715,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-10-30,REBECCA HENDERSON,F,1931-07-05,1644,FMASON@GMAIL.COM +716,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-10-30,BRETT GARCIA,M,2020-12-31,2813,CLARKNICHOLE@GMAIL.COM +717,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-30,JENNA DIAZ,F,1940-08-18,9000,NBURNS@HOTMAIL.COM +718,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-10-30,JILL GARDNER,F,1966-09-25,2443,JASONCHRISTENSEN@GMAIL.COM +719,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-10-30,ANGELA PERKINS,F,2008-10-30,5507,GMALDONADO@YAHOO.COM +720,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-10-31,AMANDA HILL,F,1990-04-08,8129,TYLER57@HOTMAIL.COM +721,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-10-31,ERIK MCDANIEL,M,1920-06-05,3016,KIMBERLYCONTRERAS@YAHOO.COM +722,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-10-31,CHELSEA SIMPSON,F,1946-07-21,2241,RWOOD@YAHOO.COM +723,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-10-31,MARK MIDDLETON,M,1941-11-17,5713,RHODESELIZABETH@YAHOO.COM +724,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-10-31,DEBORAH BISHOP,F,2016-12-25,3232,QALVAREZ@YAHOO.COM +725,UNIV. 
NACIONAL DEL COMAHUE,MEDICINA,2020-10-31,ZACHARY JORDAN,M,1958-05-16,1742,JACQUELINE73@HOTMAIL.COM +726,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-10-31,BRIDGET JAMES,F,1998-10-31,4624,HARRISONRANDALL@GMAIL.COM +727,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-10-31,TIMOTHY COSTA,M,1929-09-23,5384,ZHERNANDEZ@YAHOO.COM +728,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-10-31,NICHOLAS FLORES,M,1972-08-08,8500,JASON54@YAHOO.COM +729,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-10-31,ANNA DAVIS,F,1923-09-10,3194,DEBORAH18@HOTMAIL.COM +730,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-10-31,CHRISTOPHER WRIGHT,M,1973-03-02,6471,TERESASMITH@HOTMAIL.COM +731,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-01,RAYMOND CRAIG,M,1962-09-12,5707,SARAH15@HOTMAIL.COM +732,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-01,VICTORIA HARPER,F,1952-08-31,3463,APRIL98@YAHOO.COM +733,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-01,CORY DAVIS,M,1963-12-28,3730,JAMIE28@YAHOO.COM +734,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-01,MEGAN SMITH,F,1982-10-19,7201,COREY28@HOTMAIL.COM +735,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-01,SAMANTHA HARPER,F,2005-02-03,1765,ASMITH@HOTMAIL.COM +736,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-01,MARISSA GOMEZ,F,1978-05-21,2718,JASMINEMORRISON@YAHOO.COM +737,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-02,DR. NANCY WARREN DDS,F,2011-04-03,2347,NCOOK@GMAIL.COM +738,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-02,SEAN WEISS,M,1933-04-09,2916,DANARODRIGUEZ@GMAIL.COM +739,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-02,JARED FARLEY,M,1978-05-12,7511,UJOHNSON@GMAIL.COM +740,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-02,ANDREW BERG,M,2004-08-19,3048,CHARLESGARCIA@HOTMAIL.COM +741,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-02,DARRYL FREEMAN,M,1991-09-29,9011,LYNCHDENISE@HOTMAIL.COM +742,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-02,WILLIAM MORGAN,M,1987-08-11,8146,MILLSDUSTIN@HOTMAIL.COM +743,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-02,TAYLOR HARMON,F,1950-12-28,3322,PETER57@HOTMAIL.COM +744,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-02,ASHLEY MCKINNEY,F,2004-08-20,3338,KDANIELS@GMAIL.COM +745,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-02,ALEXANDER DURHAM,M,1958-04-27,2352,ALAN12@HOTMAIL.COM +746,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-02,CARL THOMAS,M,1986-10-28,3700,OTATE@HOTMAIL.COM +747,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-02,SCOTT YOUNG,M,1923-06-26,9013,STEVEN97@HOTMAIL.COM +748,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-03,JOSEPH FISCHER,M,2006-01-29,6360,RAYMOND31@YAHOO.COM +749,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-03,ALEJANDRA WILLIAMS,F,1970-05-28,1842,ADAM54@YAHOO.COM +750,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-03,ANDREW WALKER,M,1958-09-04,9315,DIANA62@YAHOO.COM +751,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-03,ROBERT SCOTT,M,1929-02-07,6233,JDUKE@YAHOO.COM +752,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-03,COREY MCCOY,M,1968-11-23,4178,DMILLER@GMAIL.COM +753,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-03,BRANDY PATTERSON,F,1911-09-23,3414,SIMPSONCHRISTOPHER@YAHOO.COM +754,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-03,BRENT THOMAS,M,2019-06-13,2824,NANCYMILLER@HOTMAIL.COM +755,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-03,LORI YOUNG,F,1936-10-27,9050,EGARZA@GMAIL.COM +756,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-03,DAVID GOLDEN,M,1941-11-04,1804,LFOSTER@YAHOO.COM +757,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-03,TAYLOR FOLEY,F,1949-09-23,3470,ANDREWCOX@HOTMAIL.COM +758,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-03,EMILY RHODES,F,1955-04-22,8200,NICOLE72@HOTMAIL.COM +759,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-03,STEPHEN BROWN,M,1995-03-17,1712,JENNIFER93@YAHOO.COM +760,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-03,DANIEL FORD,M,2006-12-02,6746,JUSTIN96@GMAIL.COM +761,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-03,MADISON BAILEY,F,1932-04-21,5735,SHELLY85@HOTMAIL.COM +762,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-04,KATHY MILLS,F,1932-06-12,5365,OBUCKLEY@HOTMAIL.COM +763,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-04,AMY ROBINSON,F,2012-04-10,6326,SHEILA53@YAHOO.COM +764,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-04,KELLY GLENN,F,1999-06-02,2147,MICHAELROBINSON@HOTMAIL.COM +765,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-04,ARTHUR RODRIGUEZ,M,1986-09-18,2105,PAMELAGARCIA@HOTMAIL.COM +766,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-04,DARRELL ROBINSON,M,1952-06-05,3016,JAMESSCHNEIDER@HOTMAIL.COM +767,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-04,REBECCA WILLIAMS,F,1928-12-01,5383,ANTHONYBROWN@YAHOO.COM +768,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-04,ERICA POOLE,F,1919-11-20,7313,JOHNSONKENNETH@GMAIL.COM +769,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-04,GINA BRIGHT,F,1931-03-25,2751,ZOECHAMBERS@GMAIL.COM +770,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-04,ROGER FERRELL,M,1954-02-20,5573,WGALLEGOS@GMAIL.COM +771,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-04,JOAN BALDWIN,F,1958-01-25,6725,FREYES@YAHOO.COM +772,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-04,RUBEN KING,M,1931-12-28,4163,JORDANTERRY@GMAIL.COM +773,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-04,THOMAS BENNETT,M,2021-05-15,8324,TARA84@HOTMAIL.COM +774,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-04,JOSHUA BROWN,M,1986-04-20,8132,FJONES@YAHOO.COM +775,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-04,JAMIE PORTER,F,1953-11-24,3425,BRANDON55@GMAIL.COM +776,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-04,AMY HOOVER,F,1912-11-17,3248,HOBBSSABRINA@GMAIL.COM +777,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-04,MR. KIRK RIOS DDS,M,1955-06-23,3350,KVAUGHN@HOTMAIL.COM +778,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-04,MICHELLE LONG,F,1936-04-24,5881,BOWMANBRENDA@HOTMAIL.COM +779,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-05,RICHARD FLORES,M,1994-03-14,2342,GJOHNSON@YAHOO.COM +780,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-05,NANCY RODRIGUEZ,F,1925-01-01,4650,CHRISTINEBARRETT@HOTMAIL.COM +781,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-05,DR. ANTHONY MORRIS,M,1971-12-09,3144,NATHANWALLER@HOTMAIL.COM +782,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-05,RACHEL ABBOTT,F,1926-02-05,3222,BARNESJUSTIN@GMAIL.COM +783,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-05,ROBERT GARCIA,M,1976-07-02,5511,SPENCERTHOMAS@HOTMAIL.COM +784,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-05,DENNIS FREEMAN,M,2010-08-15,7305,CHRISTOPHERRAMIREZ@GMAIL.COM +785,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-05,CHRISTOPHER SMITH,M,2010-12-14,5306,MIRANDAWALKER@GMAIL.COM +786,UNIV. 
NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-05,BETHANY WALTON,F,1940-08-02,1657,CARLA96@HOTMAIL.COM +787,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-05,BETHANY WOLFE,F,1979-01-25,4713,KIMBERLYELLIOTT@HOTMAIL.COM +788,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-05,JOSHUA BOYD,M,2010-04-13,6634,GERALD01@HOTMAIL.COM +789,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-05,JOSHUA STOKES,M,1947-07-15,5701,JENNIFER73@GMAIL.COM +790,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-05,WANDA DOWNS,F,1985-02-07,1613,EHARRIS@GMAIL.COM +791,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-05,THOMAS MOORE,M,1964-05-27,8341,STEPHANIEBARRON@YAHOO.COM +792,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-05,JAMES GOLDEN,M,1929-03-02,5569,KEVINHESS@GMAIL.COM +793,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-06,ROBERT HICKS,M,1917-08-01,8521,THALL@YAHOO.COM +794,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-06,KRISTEN DAVIS,F,1950-10-04,7226,ANTHONYJOHNSON@YAHOO.COM +795,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-06,RICHARD SMITH,M,1960-12-27,1682,ANNAMARTINEZ@YAHOO.COM +796,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-06,JOE DAVIS,M,1917-05-07,3229,CARLAROBERTS@HOTMAIL.COM +797,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-06,VERONICA FLORES,F,1956-08-25,5751,LISACOLLINS@HOTMAIL.COM +798,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-06,CASEY MURPHY,M,1955-11-01,3206,STEPHANIE85@YAHOO.COM +799,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-06,CARLOS GARZA,M,1989-02-25,3216,HAYNESLARRY@GMAIL.COM +800,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-06,MATTHEW THOMAS,M,1994-04-05,5325,JGLASS@YAHOO.COM +801,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-06,MARGARET HOLT,F,1928-03-01,5615,GARZAHEATHER@GMAIL.COM +802,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-06,LISA KAISER,F,1961-07-02,4741,KENNETHFLORES@GMAIL.COM +803,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-06,ALLEN TURNER,M,1970-11-25,6628,SETHBRENNAN@GMAIL.COM +804,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-07,MICHAEL YOUNG,M,1968-04-19,6203,KGILLESPIE@YAHOO.COM +805,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-07,THOMAS LOPEZ,M,1945-10-05,2240,PATRICIAFISHER@HOTMAIL.COM +806,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-07,ALYSSA GARZA,F,1920-04-20,3450,MARKBALLARD@YAHOO.COM +807,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-07,ALICIA ROSS,F,1929-08-14,3425,DANIEL83@HOTMAIL.COM +808,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-07,MANUEL KING,M,1987-10-10,4230,MICHELLEPERRY@GMAIL.COM +809,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-07,LINDA CHRISTENSEN,F,1998-09-25,3703,MICHELLELAMBERT@YAHOO.COM +810,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-07,LORI BARRETT,F,1963-08-06,9003,BRIGGSJEFFERY@HOTMAIL.COM +811,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-07,REBECCA OLSON,F,1993-05-02,3589,KIMBERLY98@GMAIL.COM +812,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-07,KYLE HARVEY,M,1998-02-15,7630,VILLANUEVAJUSTIN@YAHOO.COM +813,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-07,NATALIE WILLIAMS,F,1933-03-07,7507,PBUCK@HOTMAIL.COM +814,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-07,MICHELE RODRIGUEZ,F,1957-04-16,6009,ANDRADEJEFF@YAHOO.COM +815,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-07,BETH BROWN,F,1911-04-23,2520,VJOHNSON@GMAIL.COM +816,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-08,MICHELE CUEVAS,F,1973-10-12,3405,SWEENEYROBERT@YAHOO.COM +817,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-08,ALICIA RUIZ,F,1920-02-23,8308,SANDRA43@YAHOO.COM +818,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-08,THOMAS FLETCHER,M,1935-12-19,1826,MATTHEW98@GMAIL.COM +819,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-08,TERESA SMITH,F,2004-04-02,8532,JEFFREY58@HOTMAIL.COM +820,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-08,NICHOLAS MATTHEWS,M,2018-10-14,2000,MICHAELARELLANO@YAHOO.COM +821,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-08,CHRISTOPHER GRAVES,M,2001-02-21,1852,KEITH86@HOTMAIL.COM +822,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-08,MICHAEL DAVIS,M,2008-06-01,2813,TAYLORPRICE@HOTMAIL.COM +823,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-08,JENNIFER LIVINGSTON,F,1980-11-07,9053,CHARLES64@HOTMAIL.COM +824,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-09,KIMBERLY HARRIS,F,1994-11-19,5621,WBROWN@HOTMAIL.COM +825,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-09,KRISTINE COLEMAN,F,1976-07-30,3412,DANACOLE@YAHOO.COM +826,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-09,CHRISTINE FOWLER,F,1930-07-29,3203,SARADAY@GMAIL.COM +827,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-09,JERRY VELEZ,M,1994-03-15,3188,GONZALEZJEFFERY@YAHOO.COM +828,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-09,CHRISTINA SMITH,F,1978-01-13,2828,STEPHANIE41@HOTMAIL.COM +829,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-09,CHRISTOPHER RODRIGUEZ,M,2006-09-20,6352,LJONES@YAHOO.COM +830,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-09,MICHAEL SMITH,M,1936-09-16,1889,MELANIEBRADLEY@HOTMAIL.COM +831,UNIV. 
NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-09,MELINDA GORDON,F,1990-08-07,3344,RICHARDLOZANO@HOTMAIL.COM +832,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-09,SHELBY PENNINGTON,F,1981-08-02,6703,CHRISTOPHER83@HOTMAIL.COM +833,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-09,HEATHER WILSON,F,1972-03-17,6734,BBROWN@GMAIL.COM +834,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-09,LISA BONILLA,F,1929-12-05,4631,ALLENWILLIAM@GMAIL.COM +835,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-10,RICHARD BANKS,M,1966-07-14,5735,WBAKER@GMAIL.COM +836,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-10,JEFFREY MARTINEZ,M,2016-07-14,5577,MARIAROSS@GMAIL.COM +837,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-10,SHERRY WILLIAMS,F,2017-05-16,5427,MACKTHOMAS@YAHOO.COM +838,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-10,JOSE RILEY,M,2009-04-01,5557,HPARKER@GMAIL.COM +839,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-10,ALFRED CLARK,M,2007-02-20,3448,EKHAN@HOTMAIL.COM +840,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-10,STACY MARTINEZ,F,2006-04-01,1617,DAVID65@GMAIL.COM +841,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-10,CINDY RYAN,F,2020-07-06,6031,MILLERERIKA@HOTMAIL.COM +842,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-10,CONNOR GREGORY,M,1938-05-07,3222,ANGELA79@YAHOO.COM +843,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-10,BIANCA KENT,F,1971-05-26,3733,GWALLS@GMAIL.COM +844,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-10,MICHELLE SMITH,F,1989-10-16,6101,SMITHANNA@HOTMAIL.COM +845,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-10,BRANDON MACK,M,1964-07-24,5329,KNIGHTJEFFREY@YAHOO.COM +846,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-10,MICHELLE BASS,F,1949-05-27,6557,ROBERT67@GMAIL.COM +847,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-10,MICHAEL BOYD,M,1926-12-29,2173,EMILYCHAPMAN@GMAIL.COM +848,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-10,GARY HARPER,M,2021-01-27,2255,CCAMPBELL@HOTMAIL.COM +849,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-11,MR. STEVEN EVANS JR.,M,1995-02-10,8166,ARMSTRONGBRANDON@YAHOO.COM +850,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-11,JENNIFER MCLEAN,F,2018-11-21,1702,MARKANDERSON@YAHOO.COM +851,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-11,ANDREW WILLIAMS,M,1914-07-05,4640,SAMANTHAMILLER@GMAIL.COM +852,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-11,KYLE ALLEN,M,2011-01-10,6474,CHRISTOPHER88@HOTMAIL.COM +853,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-11,LANCE WARD,M,2009-02-26,3448,NATALIE49@GMAIL.COM +854,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-11,RYAN BERRY,M,1910-01-01,9107,ROBERTSMITH@GMAIL.COM +855,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-11,SUSAN PATTERSON,F,1937-04-10,2349,TURNERALICIA@HOTMAIL.COM +856,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-12,MICHAEL ARELLANO,M,1961-07-28,3309,REIDKAYLA@HOTMAIL.COM +857,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-12,MADISON BRENNAN,F,1933-11-22,3100,CHRISTOPHERSMITH@HOTMAIL.COM +858,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-12,MICHELLE HARRIS,F,1968-02-11,8187,DAVID24@YAHOO.COM +859,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-12,MICHAEL OLIVER,M,1906-07-11,3592,BBUSH@YAHOO.COM +860,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-12,DARIN PEREZ,M,2001-06-07,3575,ALLISONKING@GMAIL.COM +861,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-12,JOSEPH THOMAS,M,2003-03-26,3132,WILLIAMSMARY@YAHOO.COM +862,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-12,CYNTHIA CLARK,F,2019-01-29,3400,KCLARK@GMAIL.COM +863,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-12,GORDON HUNTER,M,1966-04-20,2915,COLLINSWENDY@GMAIL.COM +864,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-12,RENEE DAY,F,1981-11-21,9001,WBLACK@GMAIL.COM +865,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-12,AMY FRANK,F,1968-06-06,2944,QCOOK@HOTMAIL.COM +866,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-12,RYAN ESPINOZA,M,1911-10-24,3016,TORRESCHRISTINA@YAHOO.COM +867,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-12,TABITHA GARCIA,F,2010-08-11,3081,LMCDONALD@HOTMAIL.COM +868,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-12,BRENDA KING,F,1912-07-06,2324,JONATHAN60@GMAIL.COM +869,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-12,MICHELLE ROBERTS,F,1938-06-05,9207,MARTINJAMES@YAHOO.COM +870,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-13,PATRICK ALLEN,M,1916-10-30,5585,GSCOTT@YAHOO.COM +871,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-13,MELISSA KRUEGER,F,1909-12-18,2943,JOHNHOGAN@YAHOO.COM +872,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-13,MICHAEL JACOBS,M,1997-01-27,2248,BRIAN58@YAHOO.COM +873,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-13,ASHLEY GREEN,F,2019-01-14,2527,CHRISTIAN68@YAHOO.COM +874,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-13,DOROTHY WARD,F,1927-07-25,4151,HARPERCHRISTINE@HOTMAIL.COM +875,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-13,COREY ARROYO,M,1924-01-03,4101,FSMITH@HOTMAIL.COM +876,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-13,JOSEPH YANG,M,1953-04-24,6339,ROSSRAYMOND@GMAIL.COM +877,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-13,VICKIE DAVIS,F,1917-10-15,6438,HARTJULIE@GMAIL.COM +878,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-13,JESSE KENT,M,1937-01-05,1884,HANSONMARIA@YAHOO.COM +879,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-13,JANET WHITE,F,1921-02-15,4111,QGIBSON@YAHOO.COM +880,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-13,NICOLE MURRAY,F,2002-01-19,7612,CADAMS@HOTMAIL.COM +881,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-13,JOSEPH LARSEN,M,1994-11-09,2170,MARYMARTINEZ@HOTMAIL.COM +882,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-13,NANCY HUGHES,F,1913-08-17,5442,EVANCOOPER@YAHOO.COM +883,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-13,LACEY LAWRENCE,F,1941-06-09,8534,NGUYENBRENDA@YAHOO.COM +884,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-13,JESSICA DELACRUZ,F,1972-02-09,2322,MARTINHUNT@YAHOO.COM +885,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-13,ADAM MOORE,M,1957-02-12,1665,BRANDON66@HOTMAIL.COM +886,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-13,RODNEY THOMPSON,M,1992-06-18,3453,UROBERTSON@HOTMAIL.COM +887,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-13,DAVID JOHNSON,M,2020-10-14,7535,ERIC52@YAHOO.COM +888,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-13,NANCY COLON,F,1965-11-04,2303,NICOLE14@HOTMAIL.COM +889,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-14,DAVID TODD,M,1974-10-03,2407,SHAWN12@HOTMAIL.COM +890,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-14,THERESA JOSEPH,F,1989-09-14,3100,RODRIGUEZRHONDA@YAHOO.COM +891,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-14,JACOB HODGES,M,1936-05-20,9400,ROBERT74@GMAIL.COM +892,UNIV. 
NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-14,DEBRA TAYLOR,F,2012-08-18,6228,CBURGESS@HOTMAIL.COM +893,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-14,ANN EDWARDS,F,1989-03-17,6383,WALKERPETER@HOTMAIL.COM +894,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-14,SONIA FOSTER,F,1928-08-22,6000,YOUNGJEFFERY@GMAIL.COM +895,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-14,REBECCA JOHNSON,F,2002-02-23,6723,DAVID74@HOTMAIL.COM +896,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-14,WESLEY MURRAY,M,1906-09-01,6000,WPACE@GMAIL.COM +897,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-14,MEGAN NELSON,F,2016-01-07,2635,JASON60@YAHOO.COM +898,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-14,SCOTT BARRY,M,2007-10-20,6614,VMARTIN@YAHOO.COM +899,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-15,BRITTANY ADAMS,F,1907-04-29,8307,CLAIREBUTLER@HOTMAIL.COM +900,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-15,ZACHARY PACHECO,M,1984-10-01,3466,ZHARDY@YAHOO.COM +901,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-15,BETH STEWART,F,1921-02-12,2529,FGREGORY@HOTMAIL.COM +902,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-15,JULIA MCGEE,F,1975-04-06,8305,MILLERRHONDA@GMAIL.COM +903,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-15,GLENN BURNS,M,1979-12-27,3144,UMARTINEZ@YAHOO.COM +904,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-15,ELIZABETH RODRIGUEZ,F,1923-10-05,2942,TIFFANYMOSES@YAHOO.COM +905,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-15,ROBERT YOUNG,M,1915-01-02,2349,TROY50@YAHOO.COM +906,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-15,JASMINE STEIN,F,1918-07-23,2405,JHESTER@YAHOO.COM +907,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-15,KARA ADAMS,F,1972-11-05,5473,LISA26@GMAIL.COM +908,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-16,RICHARD JACOBS,M,1926-05-20,1911,JENNIFER18@YAHOO.COM +909,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-16,ELIZABETH WANG,F,1987-05-12,6213,JAIME22@HOTMAIL.COM +910,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-16,AMY POWELL,F,2013-12-12,2852,BETHWALKER@GMAIL.COM +911,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-16,MICHAEL BAXTER,M,1934-04-23,5584,GREGORY78@HOTMAIL.COM +912,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-16,STACEY SPEARS,F,1995-07-20,7009,ROBERT87@YAHOO.COM +913,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-16,DANIEL COBB,M,1997-06-08,6434,SALVARADO@GMAIL.COM +914,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-16,ASHLEY MACK,F,1917-06-06,3357,WATERSMELISSA@HOTMAIL.COM +915,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-16,TRACY JOHNSON,F,1945-10-04,8336,REBECCA95@GMAIL.COM +916,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-16,JAMES PARKER,M,1949-07-29,1702,JESSICA21@HOTMAIL.COM +917,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-16,ASHLEY DIAZ,F,1998-12-31,8431,BRIANFITZGERALD@HOTMAIL.COM +918,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-17,ADRIANA HERNANDEZ,F,1906-01-23,5345,KIMBERLYMILLER@HOTMAIL.COM +919,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-17,JASON FORD,M,2013-11-29,5460,JONESKEVIN@GMAIL.COM +920,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-17,JONATHAN BROWN,M,1947-07-03,7108,LAURIE15@GMAIL.COM +921,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-17,ABIGAIL CALDWELL,F,1971-09-03,2700,MARKGRANT@YAHOO.COM +922,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-17,TIMOTHY PAYNE,M,1983-09-19,9201,VANESSAGARCIA@GMAIL.COM +923,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-17,MICHAEL KIM,M,1934-07-28,3722,NSCHROEDER@YAHOO.COM +924,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-17,SHELLY GENTRY,F,1908-06-19,9011,NATHANGARCIA@GMAIL.COM +925,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-17,JENNIFER DUNN,F,1923-09-22,6407,JOHN08@HOTMAIL.COM +926,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-17,REBECCA VELAZQUEZ,F,1965-02-04,5759,MEGANLLOYD@HOTMAIL.COM +927,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-18,PAUL LIVINGSTON,M,2020-03-24,9041,LGARCIA@YAHOO.COM +928,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-18,JAMES TRAVIS,M,2013-02-16,6385,PALMERMATTHEW@GMAIL.COM +929,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-18,TYLER ODOM,M,1910-04-22,3474,NCARTER@GMAIL.COM +930,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-18,CHRISTOPHER SANDOVAL,M,1966-12-08,6660,KYLE46@GMAIL.COM +931,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-18,JOHN THOMPSON,M,1971-01-10,5465,FLETCHERKYLE@HOTMAIL.COM +932,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-18,CHAD JORDAN,M,2006-04-10,3226,KATHY90@GMAIL.COM +933,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-18,TIMOTHY WINTERS,M,1973-04-01,7511,BROCKMARK@YAHOO.COM +934,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-19,JENNIFER WILSON,F,1975-10-20,2415,KELLY65@HOTMAIL.COM +935,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-19,THERESA ANDERSON,F,1940-02-19,6003,AGREENE@YAHOO.COM +936,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-19,HAROLD MASON,M,1949-06-10,1925,DEANTHOMAS@YAHOO.COM +937,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-19,RACHAEL RAMIREZ,F,1953-03-03,6463,JERRY93@GMAIL.COM +938,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-19,JORDAN ANDERSON,F,2003-11-28,7249,GBERRY@YAHOO.COM +939,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-19,SANDRA HERNANDEZ,F,1974-01-22,3485,LIJACOB@YAHOO.COM +940,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-19,CYNTHIA CASTILLO,F,1977-01-24,2111,SHAFFERTRAVIS@HOTMAIL.COM +941,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-19,PAMELA BENJAMIN,F,1941-02-03,1651,ADRIANA75@HOTMAIL.COM +942,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-19,CYNTHIA HOLLOWAY,F,1949-06-19,5343,BLAIRCALEB@HOTMAIL.COM +943,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-19,SHARON ADAMS,F,1961-09-10,5773,AMANDA92@HOTMAIL.COM +944,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-19,MELISSA ROBERTSON,F,1992-11-24,7630,JOSEPHKING@GMAIL.COM +945,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-19,DOROTHY GARNER,F,1936-09-14,9039,DANIEL36@GMAIL.COM +946,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-19,HARRY WARREN,M,1995-09-22,7303,MALIK20@GMAIL.COM +947,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-19,WILLIAM HODGES,M,1997-09-10,3174,JAMES78@YAHOO.COM +948,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-19,DUSTIN BOYD,M,1931-08-29,2146,CHERYLSCHMIDT@YAHOO.COM +949,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-20,MICHELLE HARRIS,F,1917-10-13,7261,MARTINEZJOHN@HOTMAIL.COM +950,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-20,DEBRA KIRK,F,1945-12-12,5555,TDAVIS@HOTMAIL.COM +951,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-20,SHERI ROSS,F,1956-07-22,4750,MILLERANA@HOTMAIL.COM +952,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-20,DANIEL KLEIN,M,1945-03-28,5327,JDAVIS@GMAIL.COM +953,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-20,ROBIN HUGHES,F,2009-12-24,5632,THORNTONJAMES@GMAIL.COM +954,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-20,DAVID MORALES,M,1943-07-31,2846,FROBINSON@GMAIL.COM +955,UNIV. 
NACIONAL DEL COMAHUE,FARMACIA,2020-11-20,JAMES REED,M,1998-10-04,3641,EBARRETT@HOTMAIL.COM +956,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-20,RICHARD TYLER,M,1931-11-02,4512,SHANE42@GMAIL.COM +957,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-20,STEPHANIE MURPHY,F,1925-10-08,8503,DDUNCAN@YAHOO.COM +958,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-20,TROY JOHNSON,M,1934-08-28,6625,LISA42@HOTMAIL.COM +959,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-20,CHELSEA HATFIELD,F,1959-04-27,4740,ALEXISMARSHALL@GMAIL.COM +960,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-21,FRANK MILLER,M,1919-09-11,5357,EPHILLIPS@GMAIL.COM +961,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-21,FRANCIS BELL,M,2002-09-11,4135,XBROOKS@HOTMAIL.COM +962,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-21,AMANDA HINES,F,1990-08-06,7607,BENSONMICHAEL@GMAIL.COM +963,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-21,REBECCA CARTER,F,1963-07-02,7635,ERIC78@YAHOO.COM +964,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-21,DONNA CLARK,F,1930-02-07,6505,SANCHEZREBECCA@HOTMAIL.COM +965,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-21,CARRIE DAVIS,F,2005-03-08,4158,ZKHAN@GMAIL.COM +966,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-21,AMBER EDWARDS,F,1922-04-29,2315,DUNNWILLIAM@GMAIL.COM +967,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-21,DENNIS BARNES,M,1954-07-11,1882,YOUNGAARON@GMAIL.COM +968,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-21,CARLA LONG,F,1909-02-22,5340,DANIELDAVIDSON@GMAIL.COM +969,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-21,NICHOLAS MAYNARD,M,1938-02-05,3734,DDAVIS@HOTMAIL.COM +970,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-22,VALERIE SANDERS,F,1994-07-03,1667,JEFFREYSMITH@GMAIL.COM +971,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-22,DEBRA PRICE,F,1992-11-17,5609,WILLIAMHORN@HOTMAIL.COM +972,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-22,NICOLE GARCIA,F,1993-02-09,4632,DANIELLE04@GMAIL.COM +973,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-22,ELIZABETH ORTIZ,F,1945-07-10,4626,VSCOTT@HOTMAIL.COM +974,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-22,KARLA ANDERSON,F,1997-12-04,5575,FCABRERA@HOTMAIL.COM +975,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-22,DANIEL ROBERTS,M,1978-06-12,1651,XMORRIS@YAHOO.COM +976,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-22,CORY KELLY,M,1948-02-24,7507,RUSSELLAMY@GMAIL.COM +977,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-22,CHRIS MILLER,M,1991-07-16,8340,CASEYSHARON@YAHOO.COM +978,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-22,MICHELLE MORA,F,1931-11-15,5507,SMITHALAN@YAHOO.COM +979,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-22,MATTHEW COLON,M,1944-05-22,6213,PIERCENICOLAS@GMAIL.COM +980,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-23,ALAN SCOTT,M,1919-04-13,3029,BOWMANDOUGLAS@GMAIL.COM +981,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-23,JASON SCOTT,M,1939-07-13,5615,CHERYLGOODWIN@YAHOO.COM +982,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-23,MICHAEL NGUYEN,M,1972-12-16,6073,BRYAN31@GMAIL.COM +983,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-23,TAMMY SMITH,F,2008-07-03,6743,YLEE@HOTMAIL.COM +984,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-23,CHRISTOPHER GARCIA,M,1981-11-26,1602,HOLLANDALEXANDER@HOTMAIL.COM +985,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-11-23,JASON JAMES,M,1960-08-17,3574,NICHOLAS57@GMAIL.COM +986,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-23,DONNA CHAPMAN,F,1935-04-27,3224,SCOTTHERRERA@GMAIL.COM +987,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-23,DAVID MILLER,M,1973-02-19,3048,PTRAN@YAHOO.COM +988,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-24,AMANDA VAUGHN,F,1914-08-18,7261,CHRISTOPHERCOLEMAN@GMAIL.COM +989,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-24,FERNANDO MUNOZ,M,2010-03-01,7136,MACDONALDSARAH@HOTMAIL.COM +990,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-24,CAMERON MAY,M,1945-10-25,8126,LDEAN@HOTMAIL.COM +991,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-24,APRIL BURNS,F,1954-01-30,1748,RCARR@YAHOO.COM +992,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-24,MIKE PETERSON,M,1927-02-16,4612,JOHN90@HOTMAIL.COM +993,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-24,BENJAMIN RICE,M,1976-06-12,2443,LJENKINS@GMAIL.COM +994,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-24,JOHN ROBERTS,M,1957-02-16,2123,HERNANDEZALEXANDER@YAHOO.COM +995,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-24,REBEKAH GONZALES,F,1979-01-13,7609,MTERRY@YAHOO.COM +996,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-24,JARED DOMINGUEZ,M,1997-02-24,6475,LOPEZKIMBERLY@HOTMAIL.COM +997,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-24,GERALD MOORE,M,1994-04-09,1890,JEFFERY98@GMAIL.COM +998,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-24,AMY FLORES,F,1954-08-27,2848,YRODRIGUEZ@HOTMAIL.COM +999,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-25,RAY CERVANTES,M,1980-07-08,2183,JIMMY39@GMAIL.COM +1000,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-25,KEITH NEAL,M,1906-01-19,3045,DVELEZ@HOTMAIL.COM +1001,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-25,SHANNON SANDOVAL,F,2021-07-22,2440,ROTHREBECCA@GMAIL.COM +1002,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-25,JAMES TAYLOR,M,1939-12-04,1633,TORRESMEGAN@GMAIL.COM +1003,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-11-25,EDWARD MILLER,M,1983-04-28,5773,EBAILEY@HOTMAIL.COM +1004,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-25,SHELLY FRAZIER,F,1972-09-18,2117,SYLVIA45@HOTMAIL.COM +1005,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-25,DAVID MOORE,M,1919-01-09,8162,MELISSALAMBERT@YAHOO.COM +1006,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-25,LATASHA COOK,F,1987-05-17,1665,DEREK68@GMAIL.COM +1007,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-25,TERESA MONTOYA,F,1994-03-05,2183,JASONDRAKE@GMAIL.COM +1008,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-25,THOMAS BECKER,M,1930-07-26,5345,VSMITH@HOTMAIL.COM +1009,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-25,DAVID HARRIS,M,1929-09-17,3485,PATRICIACOLEMAN@YAHOO.COM +1010,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-26,JESSE STEELE,M,1912-03-03,2761,USANCHEZ@YAHOO.COM +1011,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-26,HEATHER SMITH,F,1928-11-16,3287,KATHLEENBENNETT@GMAIL.COM +1012,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-26,STEPHEN GOODMAN,M,1996-02-01,6321,DAVID38@HOTMAIL.COM +1013,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-26,KAYLA WATKINS,F,2004-01-08,5444,MICHAELDUNCAN@YAHOO.COM +1014,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-26,MATTHEW DIXON,M,2018-12-29,3572,HOWARDALEXANDRA@HOTMAIL.COM +1015,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-26,SANDRA MILLER,F,1997-03-09,8118,SUSAN84@HOTMAIL.COM +1016,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-26,JAMES SUAREZ,M,2009-07-02,3057,LROGERS@HOTMAIL.COM +1017,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-26,NATHAN JAMES,M,2016-09-30,9411,NATHANIELPORTER@HOTMAIL.COM +1018,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-26,BRETT HARPER,M,1923-12-04,1661,LKIDD@GMAIL.COM +1019,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-26,NICOLE SMITH,F,1912-08-21,5438,HOLLYMEDINA@YAHOO.COM +1020,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-11-26,THOMAS RICHARDSON JR.,M,1986-12-04,8133,LHUGHES@GMAIL.COM +1021,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-26,OLIVIA MOLINA,F,1998-01-18,5541,LEEWELLS@YAHOO.COM +1022,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-27,CHRISTOPHER DANIELS,M,1951-04-25,2311,SHANNONPETERSON@YAHOO.COM +1023,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-27,TERRI KIM,F,1951-02-16,7407,EMARSHALL@HOTMAIL.COM +1024,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-11-27,ANTHONY GEORGE,M,1941-09-05,8536,JOHN53@GMAIL.COM +1025,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-27,RODNEY COOPER,M,1950-10-05,5622,TOCHOA@YAHOO.COM +1026,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-27,MAUREEN CLARKE,F,2017-11-08,2630,PATRICKGRAY@GMAIL.COM +1027,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-27,KENNETH HILL,M,1932-02-23,5363,CHRISTOPHERWRIGHT@GMAIL.COM +1028,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-27,KAYLA RODRIGUEZ,F,1946-12-01,2138,NICHOLAS59@YAHOO.COM +1029,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-27,DANIEL THOMAS,M,1963-05-14,1727,SJOHNSON@GMAIL.COM +1030,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-27,TIMOTHY MITCHELL,M,1943-12-25,5549,UBARNES@HOTMAIL.COM +1031,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-27,STEPHANIE STEWART,F,1947-10-17,6305,ARNOLDCRAIG@YAHOO.COM +1032,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-27,ELIZABETH GATES,F,1994-02-20,5421,TIMOTHYKING@YAHOO.COM +1033,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-11-27,JOSEPH KNIGHT,M,1956-09-13,6345,DEBRALUNA@GMAIL.COM +1034,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-11-27,MEGAN HAMILTON,F,1976-05-26,5533,SHELTONLACEY@GMAIL.COM +1035,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-27,JOSHUA CARROLL,M,1934-02-07,6461,JOANN70@HOTMAIL.COM +1036,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-11-27,MATTHEW NORRIS,M,1919-05-25,3474,TORRESSAMANTHA@YAHOO.COM +1037,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-27,BRIAN MURRAY,M,1939-07-17,5359,BARNESJEREMY@GMAIL.COM +1038,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-27,SOPHIA HART,F,1998-11-18,2187,LOUISGREER@HOTMAIL.COM +1039,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-28,BRIAN ROSS,M,1949-11-04,9023,AEDWARDS@YAHOO.COM +1040,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-11-28,KELSEY DECKER,F,1975-04-30,1659,AWILLIAMS@YAHOO.COM +1041,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-28,SUSAN GREEN,F,2016-06-02,9217,DONNA60@YAHOO.COM +1042,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-28,FELICIA FOLEY,F,1930-05-27,6550,HLLOYD@HOTMAIL.COM +1043,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-28,JESSICA HOLMES,F,2006-06-23,3581,IORTIZ@GMAIL.COM +1044,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-28,SAMANTHA GARCIA,F,1908-09-02,2144,HENDRIXRAYMOND@YAHOO.COM +1045,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-11-28,KAREN CONNER,F,1931-08-14,5345,MARKWILSON@YAHOO.COM +1046,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-28,DALTON WILLIAMS,M,1983-10-17,6105,EMILY56@YAHOO.COM +1047,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-28,KEVIN RAMIREZ,M,2005-08-16,8315,PBRIDGES@HOTMAIL.COM +1048,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-28,HUNTER BAKER,M,1966-04-05,4149,ALICIAREILLY@HOTMAIL.COM +1049,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-11-28,DIANA FOSTER,F,1945-01-27,4111,CLYNCH@HOTMAIL.COM +1050,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-11-28,BRUCE WALKER,M,1988-11-23,3540,ACOSTACHELSEA@HOTMAIL.COM +1051,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-11-28,AMBER AGUILAR,F,2008-04-13,4195,GONZALEZHANNAH@GMAIL.COM +1052,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-28,JENNIFER JONES,F,1998-12-20,3052,GJOHNSON@GMAIL.COM +1053,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-29,IAN WILLIAMS,M,1907-03-12,2812,SARAGARCIA@YAHOO.COM +1054,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-11-29,PAUL SIMS,M,1993-03-20,6628,BRANDIDALTON@HOTMAIL.COM +1055,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-11-29,CRYSTAL GRAY,F,1960-11-27,4618,JEANETTELEONARD@GMAIL.COM +1056,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-29,BRIAN EDWARDS,M,1952-12-15,8508,BERNARDBRIAN@GMAIL.COM +1057,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-11-29,DENISE GUZMAN MD,F,1926-08-19,2713,ANDREWSSAMUEL@YAHOO.COM +1058,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-29,ANA KEY,F,1977-06-04,6616,RAMOSSTEVEN@GMAIL.COM +1059,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-29,WILLIAM CORTEZ,M,2018-11-24,8360,KATHERINE29@YAHOO.COM +1060,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-29,GARY MILLER,M,1928-08-15,5411,USMITH@GMAIL.COM +1061,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-11-29,DAVID DILLON,M,1967-07-21,5276,BERGERASHLEY@GMAIL.COM +1062,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-29,JENNIFER HANCOCK,F,2015-09-10,3338,JESUS07@HOTMAIL.COM +1063,UNIV. 
NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-11-29,JORDAN HANSEN,F,1920-05-12,5636,YOUNGCYNTHIA@YAHOO.COM +1064,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-11-29,RONALD LEWIS,M,2003-03-25,8113,STEPHANIE00@HOTMAIL.COM +1065,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-29,NANCY CLARK,F,2010-03-25,7167,MATTHEW84@HOTMAIL.COM +1066,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-11-29,DANIEL CERVANTES,M,1970-05-16,1771,FREEMANERICA@YAHOO.COM +1067,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-11-30,MICHAEL PRICE,M,1990-09-09,2743,SHERNANDEZ@HOTMAIL.COM +1068,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-11-30,MICHAEL WHITAKER,M,1957-03-20,8200,PATRICK36@YAHOO.COM +1069,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-11-30,PETER RICHARD,M,1977-02-24,4237,FREEMANJONATHAN@HOTMAIL.COM +1070,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-11-30,ALEXIS SMITH,F,1954-10-20,3585,ALLENTIFFANY@HOTMAIL.COM +1071,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-30,PAMELA MYERS,F,1998-03-17,6471,POWELLALEXANDER@YAHOO.COM +1072,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-11-30,NICHOLAS FREEMAN,M,2014-10-14,4626,AMANDASEXTON@GMAIL.COM +1073,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-11-30,JEFF RICE,M,1936-05-24,5319,JENNIFER21@HOTMAIL.COM +1074,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-30,CHARLES SMITH,M,1931-02-15,9301,RICHARD35@YAHOO.COM +1075,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-11-30,MARIA JONES,F,1935-12-23,3263,YATESPAULA@YAHOO.COM +1076,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-11-30,ADAM CALDWELL,M,1923-02-02,6660,MOOREDAVID@HOTMAIL.COM +1077,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-11-30,GILBERT SMITH,M,1921-01-29,2705,ERIC84@HOTMAIL.COM +1078,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-11-30,KEITH RICHARDSON,M,1978-12-06,3540,MJOHNSON@YAHOO.COM +1079,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-11-30,DANIEL PARK,M,1972-10-28,8200,GCOLE@HOTMAIL.COM +1080,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-11-30,STEVEN RODGERS,M,1994-05-08,4137,ERIVERA@GMAIL.COM +1081,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-11-30,JULIE CARTER,F,2006-05-05,9020,MWILKERSON@HOTMAIL.COM +1082,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-11-30,KIMBERLY KENT,F,1937-08-12,3176,RODRIGUEZKENNETH@YAHOO.COM +1083,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-01,SAMUEL REYES,M,1906-01-11,8313,TIMGUERRA@YAHOO.COM +1084,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-01,COURTNEY JOHNSON,F,1945-08-11,3013,VMITCHELL@HOTMAIL.COM +1085,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-01,THOMAS MEYERS,M,1910-01-15,5601,NICHOLASBLANKENSHIP@GMAIL.COM +1086,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-01,TERRY WHITE,M,2002-11-14,5722,GRAYDEVIN@HOTMAIL.COM +1087,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-01,MICHAEL HUNTER,M,2004-04-23,1718,MARK05@YAHOO.COM +1088,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-01,RHONDA GREEN,F,1938-07-14,4431,CHASEANTONIO@HOTMAIL.COM +1089,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-01,TIMOTHY WILLIAMS,M,1963-11-16,9003,KAREN79@YAHOO.COM +1090,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-01,KATHLEEN HAWKINS,F,1948-01-23,3003,CAMPBELLKEVIN@GMAIL.COM +1091,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-01,NATHAN BROWN,M,2007-02-11,1746,DANIELLE73@HOTMAIL.COM +1092,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-01,LINDA HARRIS,F,1919-09-20,3048,HPATTON@GMAIL.COM +1093,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-01,CHRISTIAN CASTILLO,M,1927-11-01,3001,CHRISTINAWEST@YAHOO.COM +1094,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-01,AMBER PERKINS,F,1978-08-13,4612,NHARRIS@YAHOO.COM +1095,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-01,KELLY NICHOLSON MD,F,1988-07-31,6214,DANIEL55@HOTMAIL.COM +1096,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-02,MARK WRIGHT,M,1984-01-14,5750,AUSTIN71@YAHOO.COM +1097,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-02,JASON HARPER,M,1930-12-25,5460,UWRIGHT@GMAIL.COM +1098,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-02,TANNER ABBOTT,M,1965-09-01,1744,WCRAWFORD@HOTMAIL.COM +1099,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-02,JARED SCOTT,M,1907-11-13,3358,LPALMER@YAHOO.COM +1100,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-02,CARL LOPEZ MD,M,1942-12-08,6341,ALEXYOUNG@HOTMAIL.COM +1101,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-12-02,AUTUMN BLACK,F,2013-02-18,6476,HJONES@YAHOO.COM +1102,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-02,MICHELLE CAMPBELL,F,1982-11-29,5592,HWARD@YAHOO.COM +1103,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-02,JAY ELLIS,M,1945-02-20,7305,SMITHJESSICA@GMAIL.COM +1104,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-03,PEGGY ADAMS,F,1943-07-17,7163,DEBORAHSMITH@YAHOO.COM +1105,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-03,SANDRA BURTON,F,1970-02-12,4500,KLEINLAUREN@GMAIL.COM +1106,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-03,MEGAN WRIGHT,F,1970-06-03,8363,LINDA63@HOTMAIL.COM +1107,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-03,RICHARD FOSTER,M,1994-08-22,7223,MICHAELBUCHANAN@YAHOO.COM +1108,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-03,MRS. 
EMILY RAMIREZ,F,1948-01-16,2258,TAYLORAMBER@YAHOO.COM +1109,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-03,ALEXANDRA MILLER,F,2003-11-28,1864,JOHNSONSHANE@YAHOO.COM +1110,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-03,MARK DUDLEY,M,2013-01-06,6203,DON55@YAHOO.COM +1111,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-03,DEANNA HILL,F,1985-05-08,1739,VMOYER@GMAIL.COM +1112,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-03,CHRISTOPHER HALL,M,2016-01-07,2752,CALEB43@GMAIL.COM +1113,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-04,KRYSTAL VELASQUEZ,F,1945-12-06,3555,GGUTIERREZ@YAHOO.COM +1114,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-04,DANIEL CLARKE,M,2008-12-10,6239,VSHEPARD@YAHOO.COM +1115,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-04,TRAVIS WARD,M,2020-12-29,8212,OCOOPER@HOTMAIL.COM +1116,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-04,STEPHEN HARRINGTON,M,1933-01-02,6307,FRANCESMILES@GMAIL.COM +1117,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-04,OLIVIA MELTON,F,1958-06-26,7160,TWATKINS@GMAIL.COM +1118,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-04,GERALD WEST,M,1945-03-17,6000,LOPEZDESTINY@GMAIL.COM +1119,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-04,CAROL WHITE,F,2015-09-02,3532,JAMES89@GMAIL.COM +1120,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-04,STEVEN WATTS,M,2006-10-19,9003,EJENKINS@HOTMAIL.COM +1121,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-04,MARISSA HENDERSON,F,1984-04-03,7260,GCHAMBERS@YAHOO.COM +1122,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-04,KATHY EVANS,F,1948-02-11,5409,CARRIEHERNANDEZ@YAHOO.COM +1123,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-04,DANIELLE HERRERA,F,1960-05-26,2512,JOHNWEBB@GMAIL.COM +1124,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-04,ALICE MOORE,F,1915-10-24,3177,ESHIELDS@HOTMAIL.COM +1125,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-05,DEBORAH NGUYEN,F,1965-05-24,4501,QSCOTT@YAHOO.COM +1126,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-05,REBECCA OROZCO,F,2007-06-14,1915,ZFREEMAN@HOTMAIL.COM +1127,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-05,JONATHAN ASHLEY,M,1931-12-17,4707,STEVEN16@HOTMAIL.COM +1128,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-05,MICHAEL HUBBARD,M,1935-06-29,3133,TAYLORSOLOMON@YAHOO.COM +1129,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-05,CODY KRAMER,M,1915-11-30,7601,WHITEJEFFERY@GMAIL.COM +1130,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-05,NATHAN GRAHAM,M,1933-12-30,1804,COLLINSCINDY@HOTMAIL.COM +1131,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-05,HOLLY LEWIS,F,1917-10-18,3188,GORDONJAMES@HOTMAIL.COM +1132,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-05,HEATHER MILLS,F,1935-10-16,3351,RCHAVEZ@YAHOO.COM +1133,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-05,LORI COOK,F,1947-03-18,5722,POPEJASON@YAHOO.COM +1134,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-05,MATTHEW CARTER,M,1933-02-17,6616,OOCONNOR@GMAIL.COM +1135,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-05,CHRISTOPHER HARPER,M,1968-09-16,1871,AARNOLD@GMAIL.COM +1136,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-12-05,RYAN GONZALEZ,M,1913-06-05,4166,MARTINEZMARK@YAHOO.COM +1137,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-05,APRIL VELASQUEZ,F,1970-10-04,5276,FRANCISSARA@GMAIL.COM +1138,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-06,JASON BARNETT,M,1973-08-29,9030,ROBERTGRAY@GMAIL.COM +1139,UNIV. 
NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-06,TAMMY JIMENEZ,F,1931-03-13,1804,HARRISCHRISTINA@HOTMAIL.COM +1140,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-06,NICHOLAS MORGAN,M,1939-09-20,2301,ROBERTSUMMERS@GMAIL.COM +1141,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-06,STEVEN MCCALL,M,1943-05-28,2848,VGARRETT@YAHOO.COM +1142,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-06,CHARLES SCHMIDT,M,2021-11-02,5401,SUSANHURLEY@HOTMAIL.COM +1143,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-06,DAVID SANTANA,M,1918-08-09,6317,REBECCAJOHNSON@HOTMAIL.COM +1144,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-06,JACK KENNEDY,M,1929-09-19,3180,ALEXANDRANOLAN@HOTMAIL.COM +1145,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-06,COURTNEY CUNNINGHAM,F,1975-05-03,5461,JACQUELINE49@GMAIL.COM +1146,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-06,BRIAN VALENCIA,M,1996-01-06,5707,COLLIERBRIAN@HOTMAIL.COM +1147,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-06,JOHN WILLIAMS,M,1947-09-15,2324,DAWN87@GMAIL.COM +1148,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-06,WALTER MEYER,M,1984-04-08,5633,JEREMY45@HOTMAIL.COM +1149,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-06,HEIDI HERNANDEZ,F,1912-07-18,7011,KATHLEENBAKER@HOTMAIL.COM +1150,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-06,SERGIO PEARSON,M,1952-04-16,3197,SUSAN89@YAHOO.COM +1151,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-12-06,DAVID FRANK,M,1944-01-23,4168,ANTHONY45@GMAIL.COM +1152,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-07,ANGELA WILLIS,F,1997-04-04,8512,MNEWTON@GMAIL.COM +1153,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-07,PHILLIP RICHARDSON,M,1924-08-14,3216,UHOLMES@GMAIL.COM +1154,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-07,OLIVIA PATTERSON,F,2014-05-05,1885,PATRICIA85@YAHOO.COM +1155,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-07,NANCY WALL,F,1965-09-12,7113,MCINTOSHLINDSAY@YAHOO.COM +1156,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-07,JOANN GIBSON,F,1919-05-14,1893,REBECCAALLEN@GMAIL.COM +1157,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-07,MELISSA HOGAN,F,2020-10-10,4601,JESUS78@GMAIL.COM +1158,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-07,SUZANNE MCDANIEL,F,1931-11-01,9303,SARAH44@YAHOO.COM +1159,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-07,MICHAEL RAMOS,M,1967-09-26,1865,EILEEN73@HOTMAIL.COM +1160,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-07,RENEE PENA,F,1911-07-16,5770,PERRYJAMES@HOTMAIL.COM +1161,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-08,CHARLES JONES,M,2000-06-11,5733,MELISSA41@YAHOO.COM +1162,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-08,MONICA WILSON,F,1941-12-27,5757,CLIFFORD69@YAHOO.COM +1163,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-08,ANGELA GREER,F,1965-07-02,7633,EDWINMARSHALL@GMAIL.COM +1164,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-08,NICHOLE LOPEZ,F,1959-09-17,7621,KIMBERLYLYONS@YAHOO.COM +1165,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-08,MELINDA HOWARD,F,1965-03-30,5449,JESSICABROOKS@GMAIL.COM +1166,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-08,TIFFANY KIM,F,1957-03-17,3474,WRIGHTKRISTOPHER@YAHOO.COM +1167,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-09,JEREMY FERNANDEZ,M,1990-08-28,3260,PATTONDEBRA@YAHOO.COM +1168,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-09,BRANDY RUIZ,F,1938-07-24,5435,ANDREWMCBRIDE@HOTMAIL.COM +1169,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-09,PATRICIA LEE,F,2014-06-23,5587,NANDERSON@YAHOO.COM +1170,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-09,REBECCA SWEENEY,F,1958-10-09,6433,EHERNANDEZ@HOTMAIL.COM +1171,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-09,JANE SMITH,F,1920-02-24,9203,ARNOLDZACHARY@YAHOO.COM +1172,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-09,RONALD HICKS,M,1908-08-06,5460,JERRYMARTIN@YAHOO.COM +1173,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-09,JOEL OWEN,M,1925-05-15,6409,KEVINSALAS@YAHOO.COM +1174,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-09,ARTHUR JENKINS,M,1935-09-14,4182,THOMPSONMARK@HOTMAIL.COM +1175,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-09,TONY GREEN,M,2007-08-03,6601,BAXTERKRISTINA@YAHOO.COM +1176,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-10,BRITTANY STEWART,F,2020-11-16,9030,HERNANDEZNICOLE@YAHOO.COM +1177,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-10,COLLEEN MARTIN,F,2010-03-04,1770,BLAKEMAUREEN@YAHOO.COM +1178,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-10,JOSHUA BAILEY,M,1962-07-07,7153,DAVIDJONES@GMAIL.COM +1179,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-10,MATTHEW ALLISON,M,1960-08-24,2252,OWILLIAMS@YAHOO.COM +1180,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-10,MELANIE WILLIAMS,F,1966-02-20,1885,MATTHEW37@GMAIL.COM +1181,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-10,KATHRYN ALLEN,F,1970-12-20,2185,EATONBROOKE@HOTMAIL.COM +1182,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-10,SCOTT GEORGE,M,1988-11-16,2843,BRITTANY55@HOTMAIL.COM +1183,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-10,KEVIN MOLINA,M,1977-06-28,3470,RRIGGS@YAHOO.COM +1184,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-10,MARTHA FERRELL,F,1985-04-25,3592,BBEASLEY@HOTMAIL.COM +1185,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-10,HANNAH NICHOLS,F,1928-09-18,1987,QALLEN@YAHOO.COM +1186,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-10,ALLISON SMITH,F,1991-06-12,5615,ROBERT42@GMAIL.COM +1187,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-10,JOSEPH WATKINS,M,1916-05-27,4145,NICOLECALHOUN@HOTMAIL.COM +1188,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-11,RICHARD COOPER,M,1974-05-05,3700,TKING@YAHOO.COM +1189,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-12-11,DONNA BISHOP,F,1912-12-01,1636,DAVID59@GMAIL.COM +1190,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-11,JADE ARMSTRONG,F,1967-03-12,8370,QHENRY@GMAIL.COM +1191,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-11,RYAN CONWAY,M,2005-03-10,1980,RALVAREZ@GMAIL.COM +1192,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-11,CASSANDRA LEE,F,2009-05-11,2905,PHILLIPSCARL@YAHOO.COM +1193,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-11,TIMOTHY SANTIAGO,M,1923-04-08,6472,SARA03@YAHOO.COM +1194,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-11,MORGAN DENNIS PHD,F,1945-12-22,2521,JOHNSONLEAH@YAHOO.COM +1195,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-11,JESSICA SALINAS,F,1933-03-11,5369,IJACKSON@GMAIL.COM +1196,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-11,RITA TAYLOR,F,1930-02-14,2843,KARENSMITH@GMAIL.COM +1197,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-11,SARAH TRAN,F,1966-02-28,8122,PETERMCLAUGHLIN@YAHOO.COM +1198,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-11,BRETT MEJIA,M,1913-11-06,8351,DCOOK@YAHOO.COM +1199,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-12,JUSTIN VALENZUELA,M,1917-01-29,5427,KELSEY42@GMAIL.COM +1200,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-12,CRAIG HAWKINS,M,1979-08-31,5331,KLINEANDREW@YAHOO.COM +1201,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-12,MR. JEFFREY VILLANUEVA,M,1962-12-18,8162,JAMES54@HOTMAIL.COM +1202,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-12,GRANT JACKSON,M,2012-05-31,2181,YJOHNSON@HOTMAIL.COM +1203,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-12,JOHN SANTOS,M,1919-06-09,1649,RWARREN@HOTMAIL.COM +1204,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-12,MICHAEL HOLMES,M,1960-08-29,9053,MSHAW@HOTMAIL.COM +1205,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-12,ALAN WALTER,M,1957-04-26,3480,MICHAEL36@HOTMAIL.COM +1206,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-12,ALEXANDER BAUTISTA,M,1988-07-04,7600,MCCLAINDANNY@GMAIL.COM +1207,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-12,DENISE HARPER,F,1941-07-06,1871,RALPH20@GMAIL.COM +1208,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-12,LAWRENCE CANNON,M,1917-06-10,3592,JESSICA37@HOTMAIL.COM +1209,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-12,MARK TREVINO,M,2008-07-30,5329,EHEATH@HOTMAIL.COM +1210,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-12,MARIA LARSON,F,1991-11-26,8164,CATHERINE31@GMAIL.COM +1211,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-12,ROBERT MYERS,M,1935-06-11,3449,JARVISJAMES@GMAIL.COM +1212,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-12,NICOLE GARZA,F,1975-07-12,2729,LINDAPOOLE@GMAIL.COM +1213,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-12,LEAH BAKER,F,1964-12-19,2258,APRILPARKS@GMAIL.COM +1214,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-13,JILLIAN HILL,F,1954-08-13,9401,DOUGLASRICE@YAHOO.COM +1215,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-13,TIMOTHY HENRY,M,2000-06-04,2154,ROBERTOROBINSON@YAHOO.COM +1216,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-13,MICHAEL FORD,M,2007-10-19,8158,NASHJUSTIN@HOTMAIL.COM +1217,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-13,JOHN MCBRIDE,M,1979-12-31,9030,IMEDINA@YAHOO.COM +1218,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-13,JOSHUA CARR,M,1970-08-25,3283,WEBBDEAN@HOTMAIL.COM +1219,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-13,JORDAN GOMEZ,M,1918-04-29,1897,DAVID93@YAHOO.COM +1220,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-13,MICHAEL MOORE,M,1972-03-31,1713,TFORBES@HOTMAIL.COM +1221,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-13,KEVIN RODRIGUEZ,M,2021-10-26,1865,MELISSADELGADO@YAHOO.COM +1222,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-13,WILLIAM BELL,M,1957-02-12,2109,ERIN70@GMAIL.COM +1223,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-13,COURTNEY ANDERSON MD,F,1993-01-05,1615,DUDLEYMICHAEL@HOTMAIL.COM +1224,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-13,CAROL HUDSON,F,2002-01-12,7241,FAGUILAR@HOTMAIL.COM +1225,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-13,DENISE KENNEDY,F,2007-04-24,6632,EBISHOP@YAHOO.COM +1226,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-14,ERIC CHASE,M,1968-01-19,2449,LOPEZEMILY@HOTMAIL.COM +1227,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-14,JO SHIELDS,F,1963-02-06,1678,HSHIELDS@YAHOO.COM +1228,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-14,DANIELLE WOLFE,F,2002-02-03,7205,CARLSONPHILLIP@HOTMAIL.COM +1229,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-14,MRS. JESSICA HARDY,F,2002-07-11,2152,GLENNKYLE@HOTMAIL.COM +1230,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-14,JOHNNY BOWMAN,M,1951-02-20,1617,HESSSAMANTHA@HOTMAIL.COM +1231,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-14,CATHERINE HUBBARD,F,1943-04-21,3700,LESLIE55@HOTMAIL.COM +1232,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-14,ANGELA LOWE,F,1912-01-29,9105,RHUNT@HOTMAIL.COM +1233,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-14,VICTORIA SANCHEZ,F,1993-03-16,1623,QCLARKE@YAHOO.COM +1234,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-14,MISS CARRIE WILLIAMS,F,2015-12-16,4622,ASANCHEZ@GMAIL.COM +1235,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-14,GILBERT GREEN,M,2000-06-01,5317,MARK28@YAHOO.COM +1236,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-14,RACHEL MARTINEZ,F,1988-09-27,5386,JONATHAN93@HOTMAIL.COM +1237,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-14,JOE DAVIS,M,1940-06-04,5553,SUSAN59@HOTMAIL.COM +1238,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-14,SARAH STANLEY,F,1961-07-29,6221,MEDINABILLY@YAHOO.COM +1239,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-15,ROBERT AYALA,M,1918-06-29,6748,ASHLEY71@YAHOO.COM +1240,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-15,JOSEPH DAVIS,M,1912-02-27,2349,WOODDENNIS@YAHOO.COM +1241,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-15,CHRISTOPHER HALL,M,1918-08-25,3380,MATHISJACOB@GMAIL.COM +1242,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-15,TAMMY SANDERS,F,1911-07-12,3405,FELICIAROMERO@YAHOO.COM +1243,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-15,CHELSEA WONG,F,2018-08-30,8183,MARCUS90@HOTMAIL.COM +1244,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-15,CHRISTOPHER WHITE,M,1961-12-07,7151,XREILLY@HOTMAIL.COM +1245,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-15,JONATHAN SKINNER,M,2010-02-25,6405,KATHY67@YAHOO.COM +1246,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-15,MICHAEL WOODARD,M,1938-05-17,6505,KIMBERLY82@YAHOO.COM +1247,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-15,LARRY HERNANDEZ,M,2008-07-20,6305,TRAVISMEDINA@HOTMAIL.COM +1248,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-15,JOHN BENTON,M,2007-11-06,1669,KIMBERLY17@YAHOO.COM +1249,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-15,LESLIE GRAY,F,1913-03-13,5438,JACQUELINEMILLER@GMAIL.COM +1250,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-16,MORGAN SCHROEDER,F,1996-02-02,6387,FHARPER@HOTMAIL.COM +1251,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-16,MICHAEL DAVIES,M,1924-02-22,5527,ELLISLAURA@GMAIL.COM +1252,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-16,WILLIAM BURNETT,M,1909-06-18,2752,REBECCA10@GMAIL.COM +1253,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-16,REBECCA JORDAN,F,1927-01-11,7118,JENNIFERPENNINGTON@HOTMAIL.COM +1254,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-17,PETER SALAZAR,M,1952-10-25,2609,KERRY32@GMAIL.COM +1255,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-17,SHAWN WELCH,M,1909-02-16,3199,TRACIE41@HOTMAIL.COM +1256,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-17,JOHN GARCIA,M,1912-11-14,9301,FRANK69@HOTMAIL.COM +1257,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-17,MRS. NICOLE FARMER MD,F,2002-06-11,5311,ASHLEY41@GMAIL.COM +1258,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-17,SANDRA FITZGERALD,F,2007-03-23,7607,REESEMEGAN@YAHOO.COM +1259,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-17,WILLIAM GILL,M,1940-08-01,5419,LEWISJULIE@HOTMAIL.COM +1260,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-17,DENISE SCOTT,F,2020-03-28,5590,NELSONJENNIFER@YAHOO.COM +1261,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-17,JENNIFER CAMPBELL,F,1946-08-05,2454,ANN68@GMAIL.COM +1262,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-17,MARY MARSHALL,F,1925-06-19,2124,RICHARDSONANDRES@GMAIL.COM +1263,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-17,NICOLE BRENNAN,F,1929-01-18,3023,WESTWILLIAM@GMAIL.COM +1264,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-17,JONATHAN GONZALEZ,M,1985-06-30,3234,STEVEARMSTRONG@GMAIL.COM +1265,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-18,DAVID FERNANDEZ,M,1962-05-27,1642,AUSTIN97@YAHOO.COM +1266,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-18,TIMOTHY FISHER,M,1924-11-04,3567,VLAWRENCE@GMAIL.COM +1267,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-18,DESIREE GREEN MD,F,1993-01-08,6235,MARYBRAY@GMAIL.COM +1268,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-18,RACHEL RIVERA,F,1947-10-12,6300,OBROWN@YAHOO.COM +1269,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-18,DOROTHY SPEARS,F,2018-08-10,5361,KEVINCOHEN@HOTMAIL.COM +1270,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-18,DANNY DAVIS,M,1990-09-28,7404,COLLINHAMILTON@YAHOO.COM +1271,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-18,FELICIA STEWART,F,2007-05-09,5751,HLOVE@HOTMAIL.COM +1272,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-18,REGINALD ROSS,M,1911-11-02,2854,KDAWSON@HOTMAIL.COM +1273,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-18,JENNIFER MCCONNELL,F,1986-08-20,2912,SANCHEZSEAN@GMAIL.COM +1274,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-18,MARY REYES,F,1998-05-16,6360,BRIANAUSTIN@HOTMAIL.COM +1275,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-18,SEAN KELLER,M,2019-07-13,4151,UTYLER@YAHOO.COM +1276,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-18,MICHAEL ANDERSON,M,1959-01-20,3530,EREED@YAHOO.COM +1277,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-18,STEVEN RASMUSSEN,M,1958-01-24,3583,MARIO10@GMAIL.COM +1278,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-18,LISA OSBORNE,F,1940-12-23,4655,GUERREROBENJAMIN@HOTMAIL.COM +1279,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-19,EMILY WHITE,F,1953-04-08,4133,YMYERS@GMAIL.COM +1280,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-19,DAVID MCGRATH,M,1914-04-06,2183,OMORGAN@GMAIL.COM +1281,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-19,MARK ERICKSON,M,1992-03-23,2173,SNYDERALICIA@YAHOO.COM +1282,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-19,JULIE FERNANDEZ,F,1958-05-15,2751,SMITHALICIA@YAHOO.COM +1283,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-19,LAUREN BAKER PHD,F,1984-04-17,1776,NELSONSCOTT@HOTMAIL.COM +1284,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-19,KATHRYN FOX,F,1916-06-15,3181,SIMPSONCHARLES@GMAIL.COM +1285,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-19,RACHEL FARRELL,F,1971-05-14,8315,JONATHON82@YAHOO.COM +1286,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-12-19,JEFFREY HENDERSON,M,1921-06-10,5300,DURANJAMES@YAHOO.COM +1287,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2020-12-19,ALEXANDRA CHRISTIAN,F,1938-12-01,2204,VLYONS@HOTMAIL.COM +1288,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-19,JILLIAN HENDERSON,F,1984-01-22,3192,KATHYGRAHAM@YAHOO.COM +1289,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-20,MARY MILLER,F,1969-08-28,8363,BRYANTSHANNON@GMAIL.COM +1290,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-20,LARRY JONES,M,1984-08-18,9033,MIGUEL35@HOTMAIL.COM +1291,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-20,SCOTT ROSS,M,1931-04-13,8375,BRENDA35@HOTMAIL.COM +1292,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-20,RICKY VILLARREAL,M,1935-12-10,6381,ZVALDEZ@GMAIL.COM +1293,UNIV. 
NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-20,JEFF ONEILL,M,1939-08-15,3503,JULIE39@GMAIL.COM +1294,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-20,RONALD DIAZ,M,1978-03-29,1888,HEATHER84@HOTMAIL.COM +1295,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-20,DR. JUSTIN KLEIN JR.,M,1989-03-23,9210,ROBERTVEGA@GMAIL.COM +1296,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-20,RICHARD AYALA,M,1939-02-18,3364,GMARTINEZ@HOTMAIL.COM +1297,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-20,KYLE DAVENPORT,M,1928-02-12,5573,JGUERRERO@HOTMAIL.COM +1298,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-20,JOSEPH WILSON,M,1975-06-10,3261,VMOORE@YAHOO.COM +1299,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-20,RAYMOND MOORE,M,2000-10-04,2728,DENISEOBRIEN@HOTMAIL.COM +1300,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-20,BETTY RIVERA,F,1984-01-21,6325,SCOTTDAVIS@GMAIL.COM +1301,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-20,BRENDA MOORE,F,1929-11-08,3465,DAVIDSONJACOB@HOTMAIL.COM +1302,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-20,ROBERT HAHN,M,1907-07-01,8361,EDWARDRODRIGUEZ@HOTMAIL.COM +1303,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-12-20,DONALD WRIGHT,M,1961-06-20,9305,ANGELA77@HOTMAIL.COM +1304,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-20,JULIE ROBERTSON,F,1934-12-07,2407,CJONES@YAHOO.COM +1305,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-20,KEVIN RICHARDSON,M,2014-04-21,9013,CHRISTINEJOHNSON@GMAIL.COM +1306,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-21,TAYLOR TAYLOR,F,1949-03-15,6352,JEREMYJONES@HOTMAIL.COM +1307,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-21,NANCY FLORES,F,1948-02-16,1755,JACKSONCANTRELL@GMAIL.COM +1308,UNIV. 
NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-21,JESSICA MORALES,F,1969-04-23,5759,RMAY@GMAIL.COM +1309,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-21,HEATHER RIVERA,F,1922-03-08,6237,DONALD66@GMAIL.COM +1310,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-21,KAREN OCONNOR,F,1931-06-22,9051,GYOUNG@GMAIL.COM +1311,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-21,JOSE WILSON,M,1971-02-11,2500,YSTEWART@YAHOO.COM +1312,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-21,PATRICIA ROBLES,F,1989-12-28,6608,GDUNN@HOTMAIL.COM +1313,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2020-12-21,ERIC DONOVAN,M,1906-01-26,2313,JEANETTEALVAREZ@YAHOO.COM +1314,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-21,FELICIA MILLER,F,1977-10-27,3516,CJOHNSON@GMAIL.COM +1315,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-21,DENISE PAYNE,F,1913-04-30,6064,CAMACHOBRIAN@HOTMAIL.COM +1316,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-21,DENISE MEYERS,F,1927-08-11,1804,SHERIPAYNE@GMAIL.COM +1317,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-22,LINDSAY PARKER,F,1956-07-30,9213,SIMONDEREK@HOTMAIL.COM +1318,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-22,SAMANTHA BAKER,F,1940-05-05,2918,SAMANTHADOUGLAS@GMAIL.COM +1319,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-22,ASHLEY HAMILTON,F,2000-01-16,1640,PECKCHRIS@HOTMAIL.COM +1320,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-22,VINCENT RODGERS,M,1923-06-17,8156,MELISSA16@HOTMAIL.COM +1321,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-22,JAMES NELSON,M,1994-08-13,7547,JAMESMARTINEZ@YAHOO.COM +1322,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-22,STEVEN HENDERSON,M,1964-07-09,5429,TIFFANYMOODY@GMAIL.COM +1323,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-12-22,ALEXANDER AGUILAR,M,1961-04-17,6559,KELLYANGELA@HOTMAIL.COM +1324,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-22,THEODORE AVILA,M,1955-03-19,3334,HARTMEGAN@GMAIL.COM +1325,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-22,STEVEN HAWKINS,M,1906-09-12,2826,JAREDARMSTRONG@YAHOO.COM +1326,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-22,TRACY CLARK,F,1952-12-21,2601,STEPHANIEWHITE@GMAIL.COM +1327,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-22,SCOTT BAILEY,M,1997-01-03,9101,LARRY54@GMAIL.COM +1328,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-22,CHRISTOPHER BELL,M,2008-02-07,1757,EGALLEGOS@YAHOO.COM +1329,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-22,SCOTT MARTIN,M,2000-01-11,1647,FREDERICK23@YAHOO.COM +1330,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-23,KRYSTAL HILL,F,1981-02-19,1828,GREGORYGRIFFITH@GMAIL.COM +1331,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2020-12-23,JESSICA COLLINS,F,2020-03-30,3480,HOWELLKEITH@HOTMAIL.COM +1332,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-23,KATHERINE CALDWELL,F,1973-11-15,3446,ANGELA44@GMAIL.COM +1333,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-23,LISA BONILLA PHD,F,2007-07-07,3342,JENNIFERMILES@GMAIL.COM +1334,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-23,KRISTINA RODRIGUEZ,F,1944-10-26,3016,WESTSTEVEN@YAHOO.COM +1335,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-23,BRYAN HALL,M,2002-07-26,7172,DANIEL68@YAHOO.COM +1336,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-23,SARA GRIFFIN,F,1923-10-31,3267,ELAINEGALLOWAY@YAHOO.COM +1337,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-23,JACQUELINE ADAMS,F,2020-10-13,3300,JONATHAN33@GMAIL.COM +1338,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-23,KRISTEN FLETCHER,F,1942-02-02,6341,JOSEPHLOWERY@GMAIL.COM +1339,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-23,AMANDA HENRY,F,1929-03-28,6471,UWAGNER@GMAIL.COM +1340,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-23,HEIDI TYLER,F,1976-10-17,3487,DAVID21@GMAIL.COM +1341,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-23,SEAN ZHANG,M,1961-03-13,9015,ERIK60@GMAIL.COM +1342,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2020-12-23,JEFFREY MILLER,M,1986-10-29,8208,JOHNTHOMPSON@GMAIL.COM +1343,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-23,GARY CHRISTENSEN,M,1993-07-22,5505,JAMES83@HOTMAIL.COM +1344,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-24,JASON FRANCO,M,1970-08-27,5883,HILLSTEVEN@HOTMAIL.COM +1345,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-24,RODNEY PATTERSON,M,1955-02-09,7517,COURTNEYCISNEROS@GMAIL.COM +1346,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-24,MRS. ASHLEE SIMMONS MD,F,1924-11-16,3150,YSMITH@HOTMAIL.COM +1347,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-24,JACK FREEMAN,M,2005-02-19,3032,XHARTMAN@YAHOO.COM +1348,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-24,MICHAELA GIBSON,F,1915-05-18,3581,AARONSANCHEZ@GMAIL.COM +1349,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2020-12-24,SAMUEL JUAREZ,M,1926-01-15,5442,BPATTERSON@GMAIL.COM +1350,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-24,JOHN GREEN,M,1938-12-12,7400,ALEXANDERKAREN@GMAIL.COM +1351,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-24,LINDA BAKER,F,1928-02-05,6034,WTAYLOR@YAHOO.COM +1352,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-24,HOLLY MCDONALD,F,1948-01-11,6345,BRETT37@GMAIL.COM +1353,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-24,JENNIFER EVANS,F,1998-08-29,6555,USCHMIDT@HOTMAIL.COM +1354,UNIV. 
NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-24,COLLEEN PERKINS,F,1983-12-26,3025,MITCHELLCARLY@HOTMAIL.COM +1355,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-24,YESENIA BARRETT,F,1962-12-19,6042,KSAWYER@HOTMAIL.COM +1356,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-24,ARTHUR SHAW,M,2017-02-02,5709,JOHNWHEELER@GMAIL.COM +1357,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-24,REBECCA BROWN,F,1945-06-25,6472,NICHOLASJONES@GMAIL.COM +1358,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-25,RYAN WELCH,M,2016-12-20,1915,BETHCAMPBELL@GMAIL.COM +1359,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-25,JULIE JOHNSON,F,1975-05-08,4618,JAMES61@HOTMAIL.COM +1360,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-25,LINDA FRANCO,F,1996-07-14,4113,AKING@GMAIL.COM +1361,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-25,JOSHUA TURNER,M,1907-10-21,2240,CHRISTOPHER85@GMAIL.COM +1362,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-25,JASON MULLINS,M,1998-06-19,2611,COURTNEY33@HOTMAIL.COM +1363,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-25,ANDREA RYAN,F,1989-08-27,9120,KEVINDECKER@GMAIL.COM +1364,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-25,SHANNON ORTEGA JR.,M,1978-04-28,5713,ALICIA56@HOTMAIL.COM +1365,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-25,KRISTEN PHELPS,F,1943-08-21,6203,MINGRAM@GMAIL.COM +1366,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-25,MICHAEL CASTILLO,M,1987-03-26,2154,SFOX@GMAIL.COM +1367,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-25,BRADLEY MILES,M,1927-01-05,6331,FLORESROBERT@YAHOO.COM +1368,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-25,JANET BAUER,F,1958-01-04,3581,ROBERT12@GMAIL.COM +1369,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2020-12-25,DANIEL ARMSTRONG,M,1947-07-18,1735,BJOHNSON@HOTMAIL.COM +1370,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2020-12-25,NICOLE JOHNSON,F,1958-05-27,8375,SPENCER19@HOTMAIL.COM +1371,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-25,CAROLYN FISHER,F,1958-07-17,7221,TAMMYAUSTIN@YAHOO.COM +1372,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-25,JOSE VAUGHN,M,1996-02-08,3137,ANDERSONCHERYL@GMAIL.COM +1373,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-25,MEGHAN WILLIAMS,F,1911-01-05,9311,BURKEDAVID@HOTMAIL.COM +1374,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-26,ROBERT WANG,M,1929-06-30,6632,JENNIFER19@GMAIL.COM +1375,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-26,KAREN WILSON,F,1950-11-06,3040,MICHELE22@YAHOO.COM +1376,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-26,CARRIE FERGUSON,F,1975-09-27,6300,MARTINBALL@YAHOO.COM +1377,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-26,ROBERT WEST,M,1932-02-18,2607,WHEELERDOUGLAS@YAHOO.COM +1378,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-26,HEIDI HUGHES,F,1982-07-29,2520,JOHN91@YAHOO.COM +1379,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-26,DEBORAH ALVAREZ,F,2011-11-22,6369,CHAPMANCHRISTOPHER@HOTMAIL.COM +1380,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-12-26,JASON ROJAS,M,1987-10-27,1648,CHRISTINAPATRICK@HOTMAIL.COM +1381,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-26,APRIL FLYNN,F,1922-06-28,3705,FFISCHER@HOTMAIL.COM +1382,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-26,JANICE ROBINSON,F,1982-12-03,7301,ROACHALEXANDRA@YAHOO.COM +1383,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-26,KIMBERLY HAYES,F,2006-01-31,3056,TRACEY11@YAHOO.COM +1384,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-27,LINDSAY JOHNSON,F,1911-11-29,3050,RJONES@HOTMAIL.COM +1385,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2020-12-27,CODY SMITH,M,2008-03-10,3705,KESTRADA@YAHOO.COM +1386,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-27,JESSICA DOMINGUEZ,F,1943-08-13,7225,MICHAELDIAZ@HOTMAIL.COM +1387,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-27,MARK ALVARADO,M,1990-11-15,5513,COLLEENRICHARDSON@YAHOO.COM +1388,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-27,CATHERINE REYNOLDS,F,2013-01-03,3466,HANNAHVAUGHN@YAHOO.COM +1389,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-27,SHELLY TAYLOR,F,1911-07-03,7623,MCKINNEYJACOB@GMAIL.COM +1390,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-27,JENNIFER BOYD,F,2006-11-01,3185,GENTRYJENNIFER@YAHOO.COM +1391,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-27,WILLIE LEE,M,1918-11-26,8334,ROBINWILLIAMS@GMAIL.COM +1392,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-27,RYAN CURTIS,M,2020-12-01,5779,TRAVISBAIRD@GMAIL.COM +1393,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2020-12-27,ROBERT COX,M,2016-12-11,7408,WASHINGTONLISA@HOTMAIL.COM +1394,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2020-12-27,KRISTEN PERKINS,F,1968-09-01,6475,YHERNANDEZ@HOTMAIL.COM +1395,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-28,ROBERT GREGORY,M,2004-09-17,3254,RHODESJENNIFER@HOTMAIL.COM +1396,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-28,ANGELA PRUITT,F,1952-09-30,7407,SCHAMBERS@HOTMAIL.COM +1397,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-28,AARON ROY,M,1918-10-13,3200,LINDSEY61@HOTMAIL.COM +1398,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2020-12-28,SARAH JOHNSON,F,1969-11-30,5592,CLARKEALLISON@GMAIL.COM +1399,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-28,NATHAN JOHNSON,M,1911-07-10,3722,PETERWHITE@HOTMAIL.COM +1400,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2020-12-28,WILLIAM JOHNSON,M,2001-07-12,3117,SMITHCODY@YAHOO.COM +1401,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2020-12-28,DIANA HINES,F,1954-12-29,6326,FSMITH@YAHOO.COM +1402,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2020-12-28,ZACHARY STAFFORD MD,M,1908-04-23,6348,TAYLORSHORT@GMAIL.COM +1403,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-28,JASON BROWN,M,1946-05-19,6042,CRYSTALMCCOY@HOTMAIL.COM +1404,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-28,CHRISTOPHER WALKER DDS,M,1940-01-19,7169,CHRISTINAMENDOZA@YAHOO.COM +1405,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2020-12-28,JACQUELINE HAMILTON,F,1986-10-03,5615,THOMAS65@GMAIL.COM +1406,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2020-12-28,TROY NELSON,M,1948-04-25,8113,COLLINSJENNIFER@GMAIL.COM +1407,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-28,KYLE SAUNDERS DDS,M,2006-02-15,9405,GLORIAWILSON@HOTMAIL.COM +1408,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-29,AMBER STEVENSON,F,1908-02-05,6032,JEFFMORGAN@HOTMAIL.COM +1409,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-29,JENNIFER LAM,F,1955-10-30,2633,PEREZJEREMY@HOTMAIL.COM +1410,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2020-12-29,JASON DEAN,M,1916-02-23,6403,AUSTINCARLSON@HOTMAIL.COM +1411,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2020-12-29,MADELINE CALDWELL,F,1955-04-19,3020,OSBORNEJOY@HOTMAIL.COM +1412,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-29,JOE RODRIGUEZ,M,1964-12-28,5738,ISAIAHWILCOX@YAHOO.COM +1413,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-29,ZACHARY REEVES,M,2010-05-23,3332,TOWNSENDDAWN@YAHOO.COM +1414,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2020-12-29,EDDIE WATKINS,M,1925-10-31,5605,MARTINRANDALL@YAHOO.COM +1415,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2020-12-29,DAWN MARTINEZ,F,1946-02-01,8183,SUMMERSALEXANDER@YAHOO.COM +1416,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-30,JORDAN BROOKS,M,1994-12-22,8109,KRISTINHOWE@GMAIL.COM +1417,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-30,RICHARD SINGH,M,1914-08-16,6621,HKRAMER@GMAIL.COM +1418,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-30,KAREN CASTRO,F,1931-07-06,6348,ERICKRUEGER@HOTMAIL.COM +1419,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-30,WAYNE HAYDEN,M,1941-07-31,3592,FARMERSUSAN@YAHOO.COM +1420,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2020-12-30,GREGORY BLAIR,M,1910-11-14,3174,KARENCOCHRAN@YAHOO.COM +1421,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-31,JONATHAN SHELTON,M,1981-09-21,6463,DAVIDLAWSON@YAHOO.COM +1422,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2020-12-31,LARRY GEORGE,M,1919-07-31,4133,DAVIDROBINSON@HOTMAIL.COM +1423,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2020-12-31,DEBRA JONES,F,1918-09-11,5470,ADAMSROBERT@GMAIL.COM +1424,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-31,MICHELE FIELDS,F,2002-06-23,4111,ECAREY@YAHOO.COM +1425,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2020-12-31,KELLY WHITE,F,2002-05-06,1737,JSALINAS@HOTMAIL.COM +1426,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2020-12-31,TINA MACDONALD,F,1961-09-17,1838,JUSTIN58@GMAIL.COM +1427,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2020-12-31,COLE ELLIS,M,2002-07-15,4147,LAURENGRAY@HOTMAIL.COM +1428,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2020-12-31,NATASHA ARNOLD,F,1944-04-30,2170,CHRISTOPHERWADE@YAHOO.COM +1429,UNIV. 
NACIONAL DEL COMAHUE,ACTUARIO ,2020-12-31,SHELLEY RODGERS,F,1925-07-08,1678,JOHN99@GMAIL.COM +1430,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2020-12-31,MARK SCOTT,M,1992-05-08,8127,KIMBERLYDAVIS@YAHOO.COM +1431,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2020-12-31,SARAH LEE,F,1936-12-07,5529,CRAIGTHOMAS@GMAIL.COM +1432,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2020-12-31,JULIE BROWNING,F,1906-08-17,1682,WEBERRANDY@YAHOO.COM +1433,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2020-12-31,LISA DAVIS,F,1977-11-11,2121,IALLEN@GMAIL.COM +1434,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2020-12-31,LISA DOWNS,F,1979-10-20,6727,MONICA97@GMAIL.COM +1435,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-01,GARRETT NAVARRO,M,2007-01-07,1631,PDOUGLAS@GMAIL.COM +1436,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-01,COURTNEY GAY,F,2007-08-16,1858,ANDREAFROST@GMAIL.COM +1437,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-01,WENDY AGUILAR,F,1914-04-06,6533,HOLTEMILY@YAHOO.COM +1438,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-01,ROBERT ROGERS,M,1946-10-28,4504,STEWARTCRYSTAL@GMAIL.COM +1439,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-01,SARAH KEY,F,1997-09-05,3416,SMITHMICHELLE@GMAIL.COM +1440,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-01,STEPHEN MATHIS,M,1947-04-18,5557,CHRISTINE82@YAHOO.COM +1441,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-01,LISA PALMER,F,1930-05-14,3530,ANTHONY05@HOTMAIL.COM +1442,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-01,NICHOLE JACKSON,F,2009-10-27,3351,SBASS@GMAIL.COM +1443,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-01,SUSAN GARCIA,F,1994-01-02,7150,GSCOTT@HOTMAIL.COM +1444,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-01,MELINDA GUTIERREZ,F,1960-08-22,1891,HALVARADO@HOTMAIL.COM +1445,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-01,JOHN GLOVER,M,2007-09-08,6434,MORRISKEVIN@GMAIL.COM +1446,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-02,JILL GARCIA,F,1947-09-19,3450,MEGANFARMER@HOTMAIL.COM +1447,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-02,WAYNE REYNOLDS,M,2016-09-27,9007,JOHNCABRERA@HOTMAIL.COM +1448,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-02,JASON WALL,M,1975-03-22,2242,FLOVE@YAHOO.COM +1449,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-02,LAURA JOHNSON,F,1981-08-07,5873,JACOB67@YAHOO.COM +1450,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-02,KAREN SCOTT,F,2014-11-30,8333,TAYLORHOLMES@GMAIL.COM +1451,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-02,JOY BRYANT,F,1975-12-13,9009,CONNOR86@GMAIL.COM +1452,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-02,KEVIN HERNANDEZ,M,1977-10-30,3423,RICHARDSCHARLES@HOTMAIL.COM +1453,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-02,DOUGLAS THOMAS,M,1993-04-14,5596,BRANDY35@HOTMAIL.COM +1454,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-02,TINA SMITH,F,1913-09-05,8500,HLOPEZ@GMAIL.COM +1455,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-02,BOBBY LOWE,M,1994-09-12,8111,HAYLEY34@YAHOO.COM +1456,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-02,MRS. NATALIE NELSON DVM,F,1995-03-12,1646,JOHNSHAW@YAHOO.COM +1457,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-02,ERIKA FLORES,F,1994-09-05,5465,ADAMSWILLIAM@GMAIL.COM +1458,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-02,JOANN CHARLES,F,1967-11-20,2852,YDAVIS@GMAIL.COM +1459,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-02,MICHELLE HARRIS,F,1995-08-13,3214,GOODROBERT@YAHOO.COM +1460,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-03,ALBERT MORAN,M,1997-09-28,3190,ELLEN71@HOTMAIL.COM +1461,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-03,ROBERT NIELSEN,M,1987-05-16,5615,CYNTHIA17@YAHOO.COM +1462,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-03,PARKER HUNTER,M,2005-10-16,1619,MICHEALDAVIS@HOTMAIL.COM +1463,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-03,JUSTIN FRANKLIN,M,1994-05-13,4740,KKAUFMAN@GMAIL.COM +1464,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-03,JENNIFER SCHROEDER,F,2015-01-20,2722,DANIELLE61@YAHOO.COM +1465,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-03,SCOTT COLEMAN,M,1930-05-23,3158,GUTIERREZSCOTT@HOTMAIL.COM +1466,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-03,ERIC THOMPSON,M,2000-06-15,1894,LAUREN78@GMAIL.COM +1467,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-03,JULIE WILSON,F,1982-07-04,3583,MICHELLE69@HOTMAIL.COM +1468,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-03,TODD BROWN,M,2007-07-24,3287,MARTINJAMES@HOTMAIL.COM +1469,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-03,SARAH ROBERTS,F,1991-05-17,2218,WRIGHTBRENDAN@HOTMAIL.COM +1470,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-03,THOMAS SILVA,M,2000-06-26,1864,DAVIDFOSTER@HOTMAIL.COM +1471,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2021-01-03,SHANE TAYLOR,M,1909-09-16,3509,HENDERSONAMBER@HOTMAIL.COM +1472,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-03,ANNA PHILLIPS,F,1906-06-22,5637,VAUGHNJOHN@YAHOO.COM +1473,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-03,MR. WALTER MARQUEZ,M,1910-11-22,7263,MICHAEL27@GMAIL.COM +1474,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-03,MISTY CARTER,F,2003-05-28,5751,TASHA15@YAHOO.COM +1475,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-03,RAYMOND WATSON,M,1924-10-22,5461,BRITTANYCHRISTIAN@HOTMAIL.COM +1476,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-04,JOSEPH MASON,M,1926-04-06,5622,FMATHIS@HOTMAIL.COM +1477,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-04,SABRINA ROBERTSON,F,1981-01-16,6348,FRANKLINMARK@GMAIL.COM +1478,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-04,BENJAMIN SIMMONS,M,1983-11-03,6434,KELLY15@HOTMAIL.COM +1479,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-04,DR. WILLIAM GRIMES JR.,M,1993-03-15,4600,NICOLECALLAHAN@GMAIL.COM +1480,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2021-01-04,ASHLEY RUSSELL,F,1927-02-23,2352,ANTHONY45@HOTMAIL.COM +1481,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-04,GEORGE WRIGHT,M,1963-12-08,8416,MEGAN83@YAHOO.COM +1482,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-04,AMANDA MCDANIEL,F,2004-10-27,5319,TAMMYSHARP@HOTMAIL.COM +1483,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-04,FELICIA COLEMAN,F,1929-05-11,8146,HWILLIAMS@YAHOO.COM +1484,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-05,JUDITH MCFARLAND,F,1919-01-08,3545,NGREEN@HOTMAIL.COM +1485,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-05,NORMA OWEN,F,1928-10-30,5719,XCAMPBELL@YAHOO.COM +1486,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-05,THEODORE SMITH,M,1934-06-18,9001,DUANE94@HOTMAIL.COM +1487,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2021-01-05,TYLER NGUYEN,M,1998-02-19,2501,PRUBIO@YAHOO.COM +1488,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-05,ELIZABETH ALVAREZ,F,2014-11-29,8521,IROBLES@HOTMAIL.COM +1489,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-05,KYLE HALL,M,1975-06-14,9420,CHRISTINA68@YAHOO.COM +1490,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-05,LINDSEY PARSONS,F,1961-02-06,5447,ACAMPBELL@GMAIL.COM +1491,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-05,ADAM HINES,M,1942-09-19,8370,ALVAREZKRISTIN@HOTMAIL.COM +1492,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-05,DAVID ROSS,M,1908-09-20,3114,RAUSTIN@GMAIL.COM +1493,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-05,MICHELE MILLER,F,1996-06-09,3041,TMOLINA@YAHOO.COM +1494,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-05,TAMARA JOHNSON,F,1915-11-14,2103,CATHERINEDANIELS@YAHOO.COM +1495,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-05,TREVOR NGUYEN,M,1938-07-05,9311,ALEXANDER06@GMAIL.COM +1496,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-05,MARIE BRUCE,F,1914-02-05,4643,VFREEMAN@GMAIL.COM +1497,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-06,DANIELLE MASON,F,1972-04-16,3555,DAVID48@YAHOO.COM +1498,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-06,ROBERT GRIFFITH,M,1938-02-11,3133,CHRISTIAN64@YAHOO.COM +1499,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-06,ELIZABETH MILLER,F,1966-11-05,2181,MONICA02@YAHOO.COM +1500,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-06,BRIAN NORTON,M,1929-09-30,6321,KRISTEN61@YAHOO.COM +1501,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2021-01-06,GAVIN TAYLOR,M,1909-08-06,3003,EDWARD24@HOTMAIL.COM +1502,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-06,HOWARD LEE,M,2013-01-07,8407,CHRISTIAN72@HOTMAIL.COM +1503,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-06,ELIZABETH SCOTT,F,1933-01-05,2400,WHITNEY13@HOTMAIL.COM +1504,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-06,ROBERT THOMAS,M,1915-10-29,9015,WOODARDJEREMY@HOTMAIL.COM +1505,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-06,GREGORY THOMPSON,M,1965-05-18,3371,MCDOWELLROBERT@GMAIL.COM +1506,UNIV. 
NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-06,RENEE SMITH,F,2016-01-24,6001,SCOLEMAN@HOTMAIL.COM +1507,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-06,DANIELLE THORNTON,F,1959-05-01,6439,NKING@HOTMAIL.COM +1508,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-06,ERIC ALLEN,M,1955-06-28,3513,MICHELLEBENSON@GMAIL.COM +1509,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-06,JESSICA DANIEL,F,2018-12-05,2723,GRANTBRENT@HOTMAIL.COM +1510,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-07,RICHARD MORGAN,M,1909-05-22,8124,ODONNELLGRANT@HOTMAIL.COM +1511,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-07,JILL REED,F,1939-06-17,5535,STEPHANIEGRIFFITH@GMAIL.COM +1512,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-07,CARMEN ESTRADA,F,1983-11-26,5609,WSMITH@GMAIL.COM +1513,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-07,MRS. ALEXANDRA RICHARDS,F,2012-01-09,5871,FSCOTT@HOTMAIL.COM +1514,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-07,TYLER SMITH,M,1975-04-28,1875,RITA46@YAHOO.COM +1515,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-07,RYAN ANDERSON,M,1920-03-18,2840,JOSEPHWHITE@GMAIL.COM +1516,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-07,ELAINE HOWELL,F,1918-03-26,2743,EDDIECLARK@GMAIL.COM +1517,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-07,ALLISON JONES,F,1973-09-05,7212,BETH01@HOTMAIL.COM +1518,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-07,SARA KLEIN,F,1998-02-13,2728,TANYABOONE@YAHOO.COM +1519,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-07,KRISTEN THOMAS,F,1982-01-06,8168,WILLIAM36@HOTMAIL.COM +1520,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-07,RONALD YOUNG,M,1960-06-04,1895,CHANDLERMARK@GMAIL.COM +1521,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-07,BRANDON JOHNSON,M,1941-09-15,3536,NEWMANMELISSA@HOTMAIL.COM +1522,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-07,DONNA SIMS,F,2005-10-14,3076,LINDSEYSAWYER@HOTMAIL.COM +1523,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-07,CHRISTOPHER BALLARD,M,1977-01-19,4147,VALEXANDER@HOTMAIL.COM +1524,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-08,KARINA PACE,F,1924-06-19,7311,RONALD53@YAHOO.COM +1525,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-08,BRETT HANSEN,M,2009-06-30,5881,XCOLE@YAHOO.COM +1526,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-08,JERRY JONES,M,1921-04-22,1812,IRICHARDSON@YAHOO.COM +1527,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-08,PATRICK SMITH,M,2007-05-16,3234,QNORMAN@YAHOO.COM +1528,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-08,LAUREN HUNTER,F,1974-01-18,1983,SGROSS@YAHOO.COM +1529,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-08,CHRISTIAN DENNIS,M,1971-09-03,6469,JOHNJONES@YAHOO.COM +1530,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-08,DEBORAH NOLAN,F,2010-10-07,4124,JBAKER@YAHOO.COM +1531,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-08,TIMOTHY HARRIS,M,1985-06-21,6538,QPIERCE@GMAIL.COM +1532,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-08,ANTHONY SWEENEY,M,1980-09-01,5722,BROOKERICE@HOTMAIL.COM +1533,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-08,VINCENT ANDERSON,M,1986-10-31,8309,UANDRADE@GMAIL.COM +1534,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-08,TAYLOR JENSEN,F,2010-02-03,3712,VANESSAWALL@YAHOO.COM +1535,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-08,DAVID CARDENAS,M,2014-04-01,3441,IRODRIGUEZ@YAHOO.COM +1536,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-08,DANIEL PITTS,M,1970-06-26,6317,WILLIAMSJESSICA@YAHOO.COM +1537,UNIV. 
NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2021-01-09,BRANDI MURRAY,F,1978-07-03,3407,VDAVIS@GMAIL.COM +1538,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-09,FRANK GREENE,M,2007-06-04,2637,TAYLORRILEY@YAHOO.COM +1539,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-09,MICHAEL PETERSON,M,1914-09-07,3382,MYERSJEFF@YAHOO.COM +1540,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-09,TIMOTHY ANDERSON,M,2012-05-23,5775,ODAVIES@HOTMAIL.COM +1541,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-09,JOHN MORROW,M,2019-10-09,3734,WBAILEY@YAHOO.COM +1542,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-09,MICHAEL MCDONALD,M,1957-09-19,3000,BENJAMIN45@YAHOO.COM +1543,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-09,AMY SMITH,F,1989-09-29,5750,ROBERTDANIELS@HOTMAIL.COM +1544,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-09,JAIME MARTINEZ,F,2019-03-19,8514,DANIELSWEENEY@YAHOO.COM +1545,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-09,KEITH COLLINS,M,1946-03-09,1921,CMILLER@YAHOO.COM +1546,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-09,JOSE LEE,M,1967-12-19,1882,HYOUNG@HOTMAIL.COM +1547,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2021-01-09,AUSTIN BARNETT,M,1932-04-14,4750,XROGERS@HOTMAIL.COM +1548,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-09,AMY FLORES,F,1950-10-10,8200,PCABRERA@HOTMAIL.COM +1549,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-09,DEANNA NEAL,F,2006-11-03,8403,TAYLORRICHARD@HOTMAIL.COM +1550,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-09,JESSICA EVANS,F,1992-03-13,1911,TINA86@HOTMAIL.COM +1551,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-09,SUZANNE PEARSON,F,1962-07-05,6330,KEITH43@YAHOO.COM +1552,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-09,ANDREW MCPHERSON,M,1987-12-28,2814,TURNERANGELA@GMAIL.COM +1553,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-09,JAY ROBINSON,M,1972-08-10,2156,GCHAVEZ@GMAIL.COM +1554,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-09,KENNETH HERNANDEZ DDS,M,1909-02-27,1625,PUGHREBECCA@HOTMAIL.COM +1555,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-09,KATHERINE BROWN DDS,F,1979-05-22,3378,FERNANDEZMARIA@HOTMAIL.COM +1556,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-10,ELIZABETH AVILA,F,1912-05-24,5703,WILLIAMMCCORMICK@HOTMAIL.COM +1557,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-10,STEVEN GROSS,M,1916-03-14,2318,AMY54@HOTMAIL.COM +1558,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-10,PETER RHODES,M,1911-07-03,3380,VCAREY@YAHOO.COM +1559,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-10,CASSANDRA ACOSTA,F,1987-01-01,8332,WAYNE25@GMAIL.COM +1560,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-10,BRAD GONZALEZ,M,1967-03-27,4186,LEAHWOODS@YAHOO.COM +1561,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-10,CAROLYN BYRD,F,1985-10-27,8403,ANDREOWENS@GMAIL.COM +1562,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-10,ELIZABETH LAM,F,1917-10-07,6400,AUSTINTHOMAS@HOTMAIL.COM +1563,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-10,TRAVIS BELL,M,1918-02-14,6326,DANIEL95@HOTMAIL.COM +1564,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-11,JERRY STANLEY,M,1988-02-28,3572,HERNANDEZCYNTHIA@HOTMAIL.COM +1565,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-11,LANCE HOFFMAN,M,2019-08-03,7407,NORTONMARC@HOTMAIL.COM +1566,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-11,KEVIN KING,M,1990-11-02,7509,LVEGA@GMAIL.COM +1567,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-11,ASHLEY GORDON,F,1924-12-06,9121,TOCONNOR@YAHOO.COM +1568,UNIV. 
NACIONAL DEL COMAHUE,FARMACIA,2021-01-11,DOUGLAS JOSEPH,M,2012-08-13,5340,WILLIAMWILSON@HOTMAIL.COM +1569,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-11,RAYMOND ELLIS,M,2005-04-07,3061,VINCENT52@HOTMAIL.COM +1570,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-11,STEPHEN SANCHEZ,M,1994-11-24,3023,LOWERYSARAH@GMAIL.COM +1571,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-11,AMY ROBINSON,F,1996-02-14,6430,NMARTIN@YAHOO.COM +1572,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-11,TANYA BARRERA,F,2013-06-19,7136,UGONZALEZ@GMAIL.COM +1573,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-11,JESUS MILLER,M,1917-01-22,9220,VANGSHAWN@GMAIL.COM +1574,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-11,NICOLE WATKINS,F,1911-03-05,2438,PAUL24@YAHOO.COM +1575,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-11,PATRICK PEREZ,M,1981-07-23,3138,IMOORE@YAHOO.COM +1576,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-11,WILLIAM LEWIS,M,1951-11-08,2643,WEBSTERJAMES@GMAIL.COM +1577,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-11,ASHLEY REEVES,F,1919-05-09,5607,SHAFFERSANDRA@GMAIL.COM +1578,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-12,LUKE DOUGHERTY,M,1927-05-27,5773,WILLIAMTAYLOR@YAHOO.COM +1579,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-12,JACOB STOUT,M,1940-12-25,3555,ULUTZ@GMAIL.COM +1580,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-12,BRENDA ROBLES,F,1983-09-17,6509,MARYMCKEE@YAHOO.COM +1581,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2021-01-12,JENNIFER WOODARD,F,2000-11-23,7247,DANIEL14@HOTMAIL.COM +1582,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-12,JOHN MILLER,M,1978-07-03,7005,ROBERTOBOWEN@YAHOO.COM +1583,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-12,JEFFREY JACOBSON,M,1963-07-20,7105,MICHAEL83@HOTMAIL.COM +1584,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-12,TIMOTHY LEWIS,M,1966-08-25,5475,SANDERSDEBORAH@YAHOO.COM +1585,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-12,JESSICA SCHMITT,F,1932-10-13,5595,MSTANLEY@GMAIL.COM +1586,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-12,DAVID HODGE,M,1914-10-23,3412,MARGARETFIGUEROA@HOTMAIL.COM +1587,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-12,THOMAS FRANKLIN,M,1990-04-15,2443,SANDOVALLAWRENCE@YAHOO.COM +1588,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-12,KRISTA CLAYTON,F,1975-11-12,6625,MAURICE27@HOTMAIL.COM +1589,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-12,LAURA RIVAS,F,1941-07-13,7305,BETTYRODRIGUEZ@HOTMAIL.COM +1590,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-12,RANDY HAWKINS,M,1996-02-29,9000,PRIVAS@GMAIL.COM +1591,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-12,CHARLES COOK,M,2020-11-28,1670,LEROY48@HOTMAIL.COM +1592,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-12,RICHARD RODGERS,M,1928-03-10,8504,BLAKE44@GMAIL.COM +1593,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-12,BEVERLY GONZALEZ,F,1911-12-20,6105,MUELLERJOSEPH@GMAIL.COM +1594,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-12,MELANIE MASON,F,1933-04-08,9421,TAYLORBRITTANY@YAHOO.COM +1595,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-13,KATHERINE JACKSON,F,1912-08-14,7226,JAVIER55@YAHOO.COM +1596,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-13,TERRI OLSON,F,2009-01-20,3190,NATHAN96@GMAIL.COM +1597,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-13,COURTNEY MARTINEZ,F,1991-10-12,1650,SANDY97@HOTMAIL.COM +1598,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-13,RICHARD HATFIELD,M,1991-04-17,3487,BRIANPOWELL@GMAIL.COM +1599,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-13,SHELLEY SWANSON,F,1923-02-06,6503,GREGORY87@GMAIL.COM +1600,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-13,VIRGINIA MITCHELL,F,2021-05-23,5741,ALLISON88@HOTMAIL.COM +1601,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-13,MATTHEW BENNETT,M,1954-05-18,2301,FMORAN@YAHOO.COM +1602,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-13,STEPHEN MOORE,M,1905-12-16,5276,RANDY37@YAHOO.COM +1603,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-13,BRANDON SMITH,M,1924-10-23,7003,SAMANTHA03@GMAIL.COM +1604,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-14,CHRISTINE FLOWERS,F,1911-04-15,5275,MICHAEL56@YAHOO.COM +1605,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2021-01-14,MELISSA ADAMS,F,1988-01-21,5717,PREYES@HOTMAIL.COM +1606,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-14,MR. JOSHUA KNIGHT,M,2002-12-15,7001,GABRIELGALLAGHER@HOTMAIL.COM +1607,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-14,DANIELLE PETERSON,F,1969-05-24,2814,KJOHNSON@HOTMAIL.COM +1608,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-14,BLAKE CAMPBELL,M,1938-04-11,2128,HERRINGCONNIE@HOTMAIL.COM +1609,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-14,NICHOLAS HUNTER,M,2019-04-18,5721,TAYLORDAVID@HOTMAIL.COM +1610,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-14,MICHAEL VILLA,M,1908-04-10,9101,PAULDENISE@GMAIL.COM +1611,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-14,LOGAN DECKER,M,1924-10-31,2747,JOHNSONGLORIA@YAHOO.COM +1612,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-14,SARAH MARTIN,F,1932-01-06,4230,KENNETH21@HOTMAIL.COM +1613,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-14,KEVIN ROBLES,M,1935-08-02,4147,DANIEL72@GMAIL.COM +1614,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-14,ERICA WARE,F,1915-10-23,5724,KEVIN51@YAHOO.COM +1615,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-14,JAMES HOFFMAN,M,1963-08-30,9310,JAMIEJOHNSON@HOTMAIL.COM +1616,UNIV. 
NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-14,HEATHER COMBS,F,1993-07-20,2240,KELLIOTT@GMAIL.COM +1617,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-15,MICHAEL MONTOYA,M,1979-11-02,2701,LMARTINEZ@GMAIL.COM +1618,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-15,MARIO JOHNSON,M,1962-06-13,9111,TSOLIS@GMAIL.COM +1619,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-15,SUZANNE WILLIAMS,F,1948-11-21,8175,BRENDA30@YAHOO.COM +1620,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2021-01-15,ALEXANDER MCCOY,M,1938-03-01,5515,WENDY07@GMAIL.COM +1621,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-15,CHRISTINA HOGAN,F,1944-10-22,5365,JORDANGARY@HOTMAIL.COM +1622,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-15,JACQUELINE WILSON,F,1924-07-08,7160,JESPARZA@YAHOO.COM +1623,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-15,SARAH DICKERSON,F,1921-03-03,3580,ANDERSONNICHOLAS@GMAIL.COM +1624,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-15,CHRISTOPHER BROWN,M,2007-07-16,5733,WMARTINEZ@YAHOO.COM +1625,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-15,MELISSA SOLIS,F,1998-11-29,8111,DIAMONDCLARK@GMAIL.COM +1626,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-15,RACHEL PARKER,F,1914-06-16,8160,MICHAEL14@HOTMAIL.COM +1627,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-15,JOSEPH HARRIS,M,2005-02-05,7519,BRITTNEY42@YAHOO.COM +1628,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-15,ROY THOMAS,M,1921-08-04,2808,LEWISROBIN@YAHOO.COM +1629,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-15,MICHAEL WILLIAMS,M,1965-08-04,1640,JAMESLEWIS@HOTMAIL.COM +1630,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-15,JOHN OBRIEN,M,1985-07-29,5417,BRANDON10@HOTMAIL.COM +1631,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-15,MEGAN MOSS,F,1962-11-19,2508,MICHELLETHOMPSON@GMAIL.COM +1632,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-15,SANDRA RODRIGUEZ,F,1952-02-20,7503,BENJAMIN95@HOTMAIL.COM +1633,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-15,KENNETH ADAMS,M,1911-05-10,1761,DOUGLAS67@HOTMAIL.COM +1634,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-15,KATHY JONES,F,1951-11-25,3003,BSCOTT@YAHOO.COM +1635,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-16,BENJAMIN REESE,M,1945-10-10,1889,WRIGHTRALPH@GMAIL.COM +1636,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-16,JACOB GARNER,M,2003-11-27,6207,WARNERMICHAEL@YAHOO.COM +1637,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-16,DAVID THOMAS,M,1992-05-26,3132,ROSEFREDERICK@GMAIL.COM +1638,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-16,ANA EVANS,F,1930-03-29,7226,BARBARAFARRELL@GMAIL.COM +1639,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-16,CHRISTOPHER PARK,M,1923-12-05,9203,WILSONDEBRA@GMAIL.COM +1640,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-16,ERIC BARR,M,1993-06-21,1744,PATTERSONJONATHAN@GMAIL.COM +1641,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-16,ANNA MORALES,F,1921-10-07,4651,WOODJULIE@YAHOO.COM +1642,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-16,NATHAN ANDERSON,M,1921-10-29,6075,PARKERWILLIAM@GMAIL.COM +1643,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-16,JOHN YU,M,1928-12-22,3380,AARON55@YAHOO.COM +1644,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-16,HEATHER SANTOS,F,1952-12-05,1684,WILSONJULIE@YAHOO.COM +1645,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-16,TINA CARROLL,F,1950-05-14,2301,DAWN50@HOTMAIL.COM +1646,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-16,ANTHONY DEAN,M,1935-11-08,3009,AARONSMITH@YAHOO.COM +1647,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-16,SAMUEL RIVERA,M,1953-01-27,2311,HYODER@GMAIL.COM +1648,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-17,CHARLES HUGHES,M,1992-03-17,2806,LOGANRONALD@HOTMAIL.COM +1649,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-17,JUSTIN BASS PHD,M,1921-06-13,3543,GVELEZ@YAHOO.COM +1650,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-17,JOANNA MONTOYA,F,1992-11-18,3712,TAMMYCLARK@HOTMAIL.COM +1651,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-17,RANDY ROJAS,M,1907-10-02,4164,CWEBB@HOTMAIL.COM +1652,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-17,LORI RANDALL,F,1969-10-19,6455,TAMI95@YAHOO.COM +1653,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-17,ROBERTO JOSEPH,M,1981-02-01,6036,TREED@GMAIL.COM +1654,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-17,SHERRY JONES,F,1968-09-25,2605,CARRIESIMS@YAHOO.COM +1655,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-17,MICHAEL FISHER,M,1992-07-18,3000,MCLAUGHLINCHERYL@YAHOO.COM +1656,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-17,BRIAN MYERS,M,1919-04-29,6734,KNIGHTMATTHEW@YAHOO.COM +1657,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-17,JOHN BROWN,M,1981-10-30,4504,SMITHAMANDA@GMAIL.COM +1658,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-17,JOSEPH BRIGGS,M,1998-03-10,8415,HERNANDEZBRIAN@GMAIL.COM +1659,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-17,ELIZABETH LEBLANC,F,1959-08-27,9407,SHELLEY61@GMAIL.COM +1660,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-18,AMBER BROWN DDS,F,1998-12-11,3206,RACHELMCDONALD@YAHOO.COM +1661,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-18,KRISTIN PERKINS,F,2009-03-31,3355,SAMUEL60@GMAIL.COM +1662,UNIV. 
NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-18,DAWN HUGHES,F,1964-05-23,1613,SHARON90@HOTMAIL.COM +1663,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-18,ANN JORDAN,F,1943-12-08,5609,RICHARD96@YAHOO.COM +1664,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-18,NICHOLAS FISHER,M,1931-06-21,5260,HARRISROBERT@YAHOO.COM +1665,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-18,JOSHUA JONES,M,1926-11-30,3346,HENDERSONCHRISTOPHER@YAHOO.COM +1666,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-18,JUSTIN ALVARADO,M,1934-12-15,1816,HARRYMASON@HOTMAIL.COM +1667,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-18,GRACE REYNOLDS,F,1920-03-17,3081,CHRISTOPHER92@YAHOO.COM +1668,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-18,KRISTIE DRAKE,F,2019-07-30,7630,WILLIAMSSAMANTHA@YAHOO.COM +1669,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-19,AARON KIM,M,1957-11-27,6721,CHRISTOPHERWOOD@YAHOO.COM +1670,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-19,NICOLE CASTANEDA,F,2001-04-20,4109,NICOLE64@HOTMAIL.COM +1671,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS GEOLÓGICAS,2021-01-19,RICKEY WILLIAMS MD,M,1913-02-26,2202,SETH53@GMAIL.COM +1672,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-19,CRISTINA HUMPHREY,F,1963-01-31,1804,ANNECONWAY@GMAIL.COM +1673,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-19,MEAGAN HARMON,F,1995-06-18,9101,WENDYFIGUEROA@HOTMAIL.COM +1674,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-19,LOUIS BENNETT,M,1954-05-14,2717,KAREN93@GMAIL.COM +1675,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-19,JILL SANFORD MD,F,1957-06-13,2449,WCOX@GMAIL.COM +1676,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-19,JOSHUA BROWN,M,1937-09-25,2309,KMCCULLOUGH@GMAIL.COM +1677,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-19,RYAN MALDONADO,M,2014-12-31,1746,GAVINHARRIS@GMAIL.COM +1678,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-19,ANDREA RANDOLPH,F,2011-10-09,5755,SANTOSHEIDI@GMAIL.COM +1679,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-19,DAVID ROWE,M,1943-08-19,7167,LUIS40@GMAIL.COM +1680,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-19,RYAN CLAY,M,1914-07-06,2255,MICHAEL23@GMAIL.COM +1681,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2021-01-19,JON KEY,M,1963-06-08,2309,GCOOPER@YAHOO.COM +1682,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-19,JOHN WRIGHT,M,1963-07-07,1614,KIMBERLYSTONE@GMAIL.COM +1683,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-19,PETER WILLIAMS,M,1971-05-14,6723,ASHLEY12@HOTMAIL.COM +1684,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-19,REBEKAH RIOS,F,1913-11-02,8309,TIMOTHYEVERETT@GMAIL.COM +1685,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-19,CHRISTINE REYNOLDS,F,2003-05-13,9121,APRILCLARK@GMAIL.COM +1686,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-20,ROBERT GUERRERO,M,1951-06-10,7406,ZPORTER@HOTMAIL.COM +1687,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-20,KATELYN WRIGHT,F,1931-10-02,3563,GLEWIS@GMAIL.COM +1688,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-20,MELANIE OCONNOR,F,1931-04-27,3190,JUSTINBELL@GMAIL.COM +1689,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-20,GEORGE CUEVAS,M,1975-07-12,3254,WENDYKNIGHT@HOTMAIL.COM +1690,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-20,MARY ALVAREZ,F,1920-10-31,9035,IWRIGHT@YAHOO.COM +1691,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-20,SHERI SCHROEDER,F,1997-04-12,5701,BURNSNICOLE@GMAIL.COM +1692,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-21,JEROME MANNING,M,2018-11-12,7612,BROWNBRIAN@YAHOO.COM +1693,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-21,TINA THOMAS,F,1974-08-25,1670,JESSICA34@YAHOO.COM +1694,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-21,MICHAEL PALMER,M,1923-06-16,6101,THERESAHERNANDEZ@GMAIL.COM +1695,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-21,ERICA PACE,F,1946-08-20,3016,ALISON24@HOTMAIL.COM +1696,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-21,KEVIN ALEXANDER,M,1987-04-22,2919,JAREDGRIMES@YAHOO.COM +1697,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-21,ASHLEY HUGHES,F,1909-11-29,3363,IBYRD@YAHOO.COM +1698,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-21,JONATHAN ORTEGA,M,1953-05-14,2248,DAVID52@HOTMAIL.COM +1699,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-21,JULIE CRANE,F,1972-11-08,3232,WGIBBS@GMAIL.COM +1700,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-21,JONATHAN THOMAS,M,1938-06-13,5407,AMYANDREWS@GMAIL.COM +1701,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-21,CHRISTINA MCCLURE,F,1919-01-29,8103,BRADFORDKATHLEEN@GMAIL.COM +1702,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-21,KAREN HURST,F,1949-07-21,7020,RODNEY75@GMAIL.COM +1703,UNIV. NACIONAL DEL COMAHUE,FARMACIA,2021-01-21,RICKY LEE,M,1953-06-02,8417,STODD@HOTMAIL.COM +1704,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-22,SHARON DAVIDSON,F,2021-05-06,8508,ELIJAHHAWKINS@GMAIL.COM +1705,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-22,LOGAN STONE,M,1961-12-14,6705,STEVENGORDON@HOTMAIL.COM +1706,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-22,JORGE MOORE,M,1987-12-31,5547,RYAN99@HOTMAIL.COM +1707,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-22,TODD OCHOA,M,1944-01-11,6551,LMCMAHON@YAHOO.COM +1708,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-22,MICHAEL ROBINSON,M,1967-12-30,7613,MFRANCIS@YAHOO.COM +1709,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-22,RYAN JENKINS,M,1942-11-11,6721,MICHAEL90@HOTMAIL.COM +1710,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-22,ELIZABETH MARTINEZ DVM,F,2012-08-23,2146,HOLLOWAYRICKY@YAHOO.COM +1711,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-23,MOLLY FARMER,F,1943-04-29,2720,ARAMIREZ@HOTMAIL.COM +1712,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-23,KENNETH FLOWERS,M,1964-01-11,2754,HARRISTYLER@GMAIL.COM +1713,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-23,DAVID GREENE MD,M,1963-07-25,2845,DALTON68@YAHOO.COM +1714,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-23,CHARLES WILEY,M,1919-03-23,3440,ASHLEYSANCHEZ@GMAIL.COM +1715,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-23,KEVIN HAMILTON,M,1910-03-18,4514,JACQUELINE98@YAHOO.COM +1716,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-23,AMY LITTLE,F,1952-06-08,5541,CHRISTY85@HOTMAIL.COM +1717,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-23,MARK ARNOLD,M,2020-03-22,5773,CAMPBELLSAMANTHA@HOTMAIL.COM +1718,UNIV. NACIONAL DEL COMAHUE,ARQUITECTURA,2021-01-23,LAUREN WOOD,F,1975-03-03,3014,BRANDI48@GMAIL.COM +1719,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-23,ROBERTA WILLIAMS,F,1915-01-20,6387,MICHELLEWILLIS@HOTMAIL.COM +1720,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-23,DAWN JEFFERSON,F,1956-11-23,3551,JUAN36@YAHOO.COM +1721,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-23,KIMBERLY PRICE,F,2015-08-24,9303,DAVIDCOOKE@HOTMAIL.COM +1722,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-23,BARBARA VAUGHN,F,1982-11-08,6017,WILLIAMSONKAYLA@YAHOO.COM +1723,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-24,CYNTHIA SNYDER,F,1987-12-08,2175,WEBERSABRINA@YAHOO.COM +1724,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-24,DANIEL ORTEGA PHD,M,2011-11-10,6315,FRANK71@HOTMAIL.COM +1725,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-24,JOSHUA CARTER,M,1965-11-08,5711,HGREER@YAHOO.COM +1726,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-01-24,FRANK WARREN II,M,1921-04-26,7106,AJOHNSON@GMAIL.COM +1727,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-25,RICHARD MACIAS,M,1912-08-27,7307,YKIM@YAHOO.COM +1728,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-25,BRAD HERNANDEZ,M,1934-03-22,5345,ALYSSA88@YAHOO.COM +1729,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-25,KRISTINE EDWARDS,F,2012-02-16,4231,MDURAN@YAHOO.COM +1730,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-25,BRANDI HALL,F,1972-01-15,4504,PUGHTIMOTHY@GMAIL.COM +1731,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-25,TONYA STEELE,F,1937-11-05,1646,LATOYA42@YAHOO.COM +1732,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN KINESIOLOGÍA Y FISIATRÍA,2021-01-25,WENDY PARKER,F,1914-08-21,1614,ISANCHEZ@GMAIL.COM +1733,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-25,REGINA GRIFFIN,F,1915-11-09,2607,DEREKBARBER@YAHOO.COM +1734,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-25,JAMES PETERSON,M,1979-01-15,3522,UMCKEE@HOTMAIL.COM +1735,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-25,DEANNA EVANS,F,1983-03-17,3156,CHRISTOPHER84@YAHOO.COM +1736,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-25,ALLISON HERNANDEZ,F,1953-04-18,8412,DALTONWILLIAM@HOTMAIL.COM +1737,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-25,KEITH BROWN,M,1957-01-06,5773,SAMANTHAGORDON@GMAIL.COM +1738,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-25,RICHARD BOOTH,M,1989-01-13,2183,MORTONSTACY@GMAIL.COM +1739,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-26,STEPHANIE MCKNIGHT,F,2014-12-30,7505,XFLORES@GMAIL.COM +1740,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-26,CYNTHIA CARTER,F,1969-05-22,1631,JESSICA97@YAHOO.COM +1741,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-26,CANDACE JONES MD,F,2018-03-15,9305,HARDINKEITH@YAHOO.COM +1742,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-26,MR. CHRISTOPHER JACKSON,M,1958-09-07,5735,CALDERONBRITTANY@GMAIL.COM +1743,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-26,DIANA HALL,F,2021-04-12,3125,RICHARD95@YAHOO.COM +1744,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-26,TYLER IRWIN,M,1997-05-02,8316,DUNNTRACY@HOTMAIL.COM +1745,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-26,BENJAMIN FOSTER,M,1984-06-03,4622,BRANDIMCCULLOUGH@HOTMAIL.COM +1746,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-26,CHRISTOPHER WATTS,M,1990-01-31,9050,GSNYDER@YAHOO.COM +1747,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-26,HEIDI WARREN,F,1977-09-19,1655,MWEAVER@YAHOO.COM +1748,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-26,JAMIE MARTIN,F,1922-12-25,2216,ANNE53@HOTMAIL.COM +1749,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS ANTROPOLÓGICAS,2021-01-26,TODD GORDON,M,1979-12-08,3381,MUELLERDONNA@GMAIL.COM +1750,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-26,DEVIN WILLIAMS JR.,M,1931-01-12,1832,JOSEPH95@GMAIL.COM +1751,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-26,WILLIAM CONTRERAS,M,1909-04-18,2201,NICOLEJONES@HOTMAIL.COM +1752,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-27,TIMOTHY HERNANDEZ,M,1918-03-03,5321,JULIEKIM@GMAIL.COM +1753,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-01-27,JESSICA CURRY,F,2002-07-28,1907,JEFFREY86@GMAIL.COM +1754,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-27,NICHOLAS HENSON,M,1978-08-23,2843,JAMESKEVIN@GMAIL.COM +1755,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-27,MATTHEW BRIDGES,M,1908-01-11,1984,TAYLORPEREZ@HOTMAIL.COM +1756,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-27,COURTNEY BRYAN,F,1991-01-07,1856,HOWARDZACHARY@HOTMAIL.COM +1757,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-27,BRANDON PEREZ,M,1986-03-20,2805,MICHELLESANCHEZ@YAHOO.COM +1758,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-27,HERBERT JACKSON,M,2020-12-23,5311,SOLISMICHAEL@HOTMAIL.COM +1759,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-27,GINA HOFFMAN,F,1969-03-07,2503,MICHAEL52@HOTMAIL.COM +1760,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-27,TROY HARRIS,M,1907-02-03,3011,BEVERLYCOX@GMAIL.COM +1761,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-27,MICHAEL MORALES,M,2004-07-19,2763,MCFARLANDJOHNNY@YAHOO.COM +1762,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-27,CHRISTOPHER SALAZAR,M,1914-02-22,6505,CONNOR46@YAHOO.COM +1763,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA EDUCACIÓN ,2021-01-28,BRANDON LANG,M,2006-05-01,9220,JOSEPHBOYD@HOTMAIL.COM +1764,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-28,PATRICK CHRISTENSEN,M,1917-07-29,2622,JACQUELINE29@GMAIL.COM +1765,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-28,GEOFFREY TAYLOR,M,1965-01-18,5560,MARGARET95@GMAIL.COM +1766,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-28,ROY MICHAEL,M,1946-05-21,5557,GREGORY43@HOTMAIL.COM +1767,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-28,DR. NICOLE BLACK MD,F,1921-01-12,1768,CHOICARRIE@YAHOO.COM +1768,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-28,LISA ESPINOZA,F,1924-04-13,9220,STEVEN98@GMAIL.COM +1769,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-28,AMBER HAWKINS,F,2014-12-20,3449,RYAN00@GMAIL.COM +1770,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-28,ALICIA HALEY,F,2000-10-02,3023,SHAFFERJOSEPH@GMAIL.COM +1771,UNIV. NACIONAL DEL COMAHUE,CIENCIAS VETERINARIAS,2021-01-28,JUSTIN MCDONALD,M,2016-11-27,6513,ZTHOMAS@HOTMAIL.COM +1772,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-28,MONIQUE CERVANTES,F,1978-12-09,5421,SARAH24@HOTMAIL.COM +1773,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-28,WHITNEY CARR,F,1907-07-25,5501,CHRISTINA10@YAHOO.COM +1774,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-28,ROBERT SMITH,M,1912-02-06,1885,MARKRUSSELL@HOTMAIL.COM +1775,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-28,BRIAN RICHARDS,M,2016-02-03,1735,BROWNELIZABETH@HOTMAIL.COM +1776,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-29,ASHLEY FROST,F,1928-02-18,8521,HRASMUSSEN@HOTMAIL.COM +1777,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-29,JILL TERRY,F,2012-02-28,2747,JEFFREYGARNER@HOTMAIL.COM +1778,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-29,DEBRA JOHNSON,F,1935-10-22,6078,LANGJEREMY@YAHOO.COM +1779,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN RELACIONES DEL TRABAJO ,2021-01-29,STEPHANIE LOGAN,F,1981-04-23,7605,YFISHER@HOTMAIL.COM +1780,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-29,MELISSA DANIELS,F,1974-02-22,4518,RIVERAERIC@YAHOO.COM +1781,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-29,CASEY WARD,M,1913-11-16,2177,RYAN94@YAHOO.COM +1782,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PSICOLOGÍA,2021-01-29,JENNIFER DAVIS MD,F,1950-11-10,6453,LHERNANDEZ@HOTMAIL.COM +1783,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-29,LINDSEY KIM,F,1951-11-30,7114,DAVIDBUSH@HOTMAIL.COM +1784,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-29,DARREN HOLMES,M,1942-06-14,3076,JHALL@YAHOO.COM +1785,UNIV. NACIONAL DEL COMAHUE,CONTADOR PÚBLICO ,2021-01-29,FELICIA SMITH,F,1969-09-20,2707,ROBINSONCAITLIN@YAHOO.COM +1786,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-29,RACHEL MALONE,F,1973-04-30,9040,JAMES64@GMAIL.COM +1787,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-29,LISA PERRY,F,1941-11-26,3117,BASSSARAH@YAHOO.COM +1788,UNIV. NACIONAL DEL COMAHUE,ACTUARIO ,2021-01-29,TIMOTHY BROWN,M,2003-08-28,5743,JONATHANMILLER@HOTMAIL.COM +1789,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-29,DEBRA JOHNSON,F,1974-03-19,3443,LOVEIAN@YAHOO.COM +1790,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-29,CARRIE JOHNSON,F,1956-11-30,6305,NMCLEAN@HOTMAIL.COM +1791,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-30,SARAH JOHNSTON,F,1961-10-23,1607,UBUSH@GMAIL.COM +1792,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA Y TECNOLOGÍA DE ALIMENTOS,2021-01-30,KELLY SIMPSON,F,2012-11-09,5624,YCOFFEY@YAHOO.COM +1793,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-30,LINDA NASH,F,1976-08-06,5275,ORTEGADAVE@HOTMAIL.COM +1794,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA MECÁNICA,2021-01-30,JONATHAN TAYLOR,M,1975-02-12,2943,ALANBENNETT@YAHOO.COM +1795,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS DE LA COMPUTACIÓN,2021-01-30,ISAAC SUAREZ,M,2020-12-08,4109,ALAWRENCE@YAHOO.COM +1796,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-30,ALLEN PHELPS,M,1913-09-08,3188,YHARRIS@HOTMAIL.COM +1797,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-30,GREGORY WRIGHT,M,1977-10-28,6475,SARAHSLOAN@YAHOO.COM +1798,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS AMBIENTALES,2021-01-30,JEFFREY WARD,M,1937-10-24,6665,JASMINE13@GMAIL.COM +1799,UNIV. 
NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-30,EMILY ALEXANDER,F,1951-09-10,4187,ZPARRISH@HOTMAIL.COM +1800,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-30,RICHARD RICE,M,1982-03-06,1980,MORALESTHOMAS@HOTMAIL.COM +1801,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN MUSICOTERAPIA,2021-01-30,JOHN SIMPSON,M,1916-11-18,3342,JENNA23@YAHOO.COM +1802,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN TERAPIA OCUPACIONAL,2021-01-30,CORY CHURCH MD,M,1976-01-24,3334,ASHLEYWILLIAMS@GMAIL.COM +1803,UNIV. NACIONAL DEL COMAHUE,BIOQUÍMICA,2021-01-30,SHAWN HAHN,M,2006-02-23,8115,CHRISTY55@GMAIL.COM +1804,UNIV. NACIONAL DEL COMAHUE,INGENIERÍA ELECTRÓNICA,2021-01-30,RICHARD HARRISON,M,1917-05-13,3071,PIERCEHEATHER@GMAIL.COM +1805,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ADMINISTRACIÓN ,2021-01-30,RUSSELL DAVIS,M,1964-12-17,6405,DCHAN@GMAIL.COM +1806,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-30,LAWRENCE WHEELER,M,1991-09-29,5272,PAULTHOMAS@HOTMAIL.COM +1807,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-30,WILLIAM PRICE,M,1920-03-11,2732,SWANSONJOSEPH@GMAIL.COM +1808,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-30,KATRINA COOKE,F,2012-04-10,3376,MICHELESMITH@GMAIL.COM +1809,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-01-30,KRISTEN LUCERO,F,1919-09-19,1923,WHITEMATTHEW@HOTMAIL.COM +1810,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-30,TERESA COOPER,F,1931-05-13,3328,XMANN@GMAIL.COM +1811,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PLANIFICACIÓN Y DISEÑO DEL PAISAJE,2021-01-31,ANGELA COPELAND,F,1984-06-03,6513,EDANIELS@YAHOO.COM +1812,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-31,CHRISTOPHER ESTRADA,M,1964-11-14,2812,WILLIAMPORTER@HOTMAIL.COM +1813,UNIV. NACIONAL DEL COMAHUE,MEDICINA,2021-01-31,MEGAN GLOVER,F,2021-01-25,8129,JONESDEBORAH@HOTMAIL.COM +1814,UNIV. 
NACIONAL DEL COMAHUE,INGENIERÍA EN INFORMÁTICA,2021-01-31,ANNA RICHMOND,F,1964-01-14,4753,FTHOMPSON@YAHOO.COM +1815,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN GESTIÓN DE AGROALIMENTOS,2021-01-31,WILLIAM TAYLOR,M,1915-06-20,2449,HOLLY49@GMAIL.COM +1816,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-31,THERESA GONZALES,F,1963-03-25,8208,PALMERLORI@GMAIL.COM +1817,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-31,ASHLEY OSBORNE,F,1965-03-26,2715,RCOFFEY@HOTMAIL.COM +1818,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIA POLÍTICA ,2021-01-31,ALAN CRANE,M,1906-08-15,2216,BRANDI05@YAHOO.COM +1819,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN SOCIOLOGÍA ,2021-01-31,TROY MASON,M,2015-01-19,6345,MARGARET95@YAHOO.COM +1820,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN PRODUCCIÓN DE BIOIMAGENES,2021-01-31,LISA HANNA DVM,F,1959-11-29,2615,MCDONALDJOSHUA@HOTMAIL.COM +1821,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-01-31,LANCE WILLIAMS,M,1982-10-11,7247,JENNIFER42@GMAIL.COM +1822,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-01-31,ABIGAIL MAYS,F,1961-09-12,9225,MARIA16@YAHOO.COM +1823,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-01-31,RYAN DAVIS,M,1934-12-23,3328,PATRICIAZAMORA@GMAIL.COM +1824,UNIV. NACIONAL DEL COMAHUE,DISEÑO DE IMAGEN Y SONIDO,2021-02-01,JAMES HODGE,M,1948-04-14,8160,NORRISSTEPHEN@GMAIL.COM +1825,UNIV. NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-02-01,DR. JENNIFER BRYANT MD,F,1997-03-14,8319,FJOHNSON@YAHOO.COM +1826,UNIV. NACIONAL DEL COMAHUE,TÉCNICO PARA BIOTERIOS ,2021-02-01,KEITH RICHARDSON,M,2018-07-01,3466,KINGJOSEPH@YAHOO.COM +1827,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN CIENCIAS BIOLÓGICAS,2021-02-01,RICHARD ROBLES,M,2010-07-15,8324,KYLEGRAHAM@HOTMAIL.COM +1828,UNIV. NACIONAL DEL COMAHUE,LICENCIATURA EN ARTES,2021-02-01,STEPHANIE WILLIAMS,F,1916-01-18,5471,JVALDEZ@HOTMAIL.COM +1829,UNIV. 
NACIONAL DEL COMAHUE,DISEÑO INDUSTRIAL,2021-02-01,JENNIFER COHEN,F,1984-08-13,4157,RRAMIREZ@HOTMAIL.COM +1830,UNIV. NACIONAL DEL COMAHUE,AGRONOMÍA,2021-02-01,PAUL BYRD,M,1944-08-19,1746,SHEILA73@YAHOO.COM diff --git a/files/GBUNSalvador_select.csv b/files/GBUNSalvador_select.csv new file mode 100644 index 00000000..9ad9a4bd --- /dev/null +++ b/files/GBUNSalvador_select.csv @@ -0,0 +1,1905 @@ +,universidad,carrera,fecha_de_inscripcion,nombre,sexo,fecha_nacimiento,localidad,email +0,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,01-Sep-20,CAROL_DOYLE,F,27-Jul-06,COLONIA_LA_BLANQUITA,ANTHONY88@GMAIL.COM +1,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,01-Sep-20,HEIDI_TRAN,F,15-Jul-28,LAGUNA_DEL_BARRO,TODD44@HOTMAIL.COM +2,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,01-Sep-20,RACHAEL_HARRINGTON,F,13-Oct-64,ANTONIO_CARBONI,ZCANTRELL@YAHOO.COM +3,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,01-Sep-20,RYAN_SILVA,M,13-Jan-25,COMANDANTE_LEAL,HEATHER60@GMAIL.COM +4,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,01-Sep-20,TIFFANY_KNIGHT,F,08-Sep-76,ALFREDO_DEMARCHI,BWARNER@GMAIL.COM +5,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,01-Sep-20,TYLER_ROSS,M,09-Sep-29,ARROYO_DE_LA_CRUZ,MARTINEZSTEPHANIE@GMAIL.COM +6,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,01-Sep-20,CAITLYN_FARRELL,F,16-Nov-40,ALDEA_APELEG,DROMAN@HOTMAIL.COM +7,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,01-Sep-20,ALBERT_REILLY,M,20-Apr-18,PUERTO_OJO_DE_AGUA,AMYSIMMONS@YAHOO.COM +8,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,01-Sep-20,KIM_GARZA,F,31-Dec-28,AGUA_LINDA,LWILSON@HOTMAIL.COM +9,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,01-Sep-20,DONNA_HICKS,F,05-Sep-34,PLANICIE_BANDERITA,KELLEYJAMES@GMAIL.COM +10,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,01-Sep-20,DAVID_NGUYEN,M,26-Feb-65,CAMPO_GARCIA,OWENDAWN@YAHOO.COM 
+11,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,02-Sep-20,NANCY_HOPKINS,F,22-Oct-12,HARAS_SAN_JACINTO,TARAKOCH@GMAIL.COM +12,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,02-Sep-20,ANNA_WILLIAMS,F,21-Jul-99,LA_LIMPIA,ELIZABETH50@YAHOO.COM +13,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,02-Sep-20,DARRELL_VILLA,M,04-Dec-14,AGUA_BLANCA,SKIM@GMAIL.COM +14,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,02-Sep-20,TAMMY_YOUNG,F,08-Jun-99,EMPALME_FRONTERA,USHERMAN@GMAIL.COM +15,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,02-Sep-20,RACHEL_MILLER,F,17-Dec-78,ABRA_DE_HINOJO,BRIAN17@GMAIL.COM +16,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,02-Sep-20,KRISTEN_LONG,F,17-Mar-08,COLONIA_MACKINLAY,BEARDMELINDA@YAHOO.COM +17,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,02-Sep-20,MRS._ANGELA_WILSON,F,31-Jul-53,AGUA_DEL_SIMBOL,TERESA23@GMAIL.COM +18,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,02-Sep-20,MELANIE_CHAN,F,24-May-72,AGUA_DE_TORRE,HOOVERJAMES@HOTMAIL.COM +19,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,02-Sep-20,VINCENT_ROMERO,M,23-Aug-19,CUCULLU,VPETERSON@HOTMAIL.COM +20,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,02-Sep-20,SHARON_MALDONADO,F,24-Dec-68,LA_DULCE,XCALDERON@YAHOO.COM +21,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,02-Sep-20,SHAWN_HOLT,M,16-Sep-11,CAMPO_SAN_JOSE,NATHAN85@YAHOO.COM +22,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,02-Sep-20,MELISSA_WRIGHT,F,06-Jan-95,CAMPO_LA_FLOR_LOS_RALOS,VWILSON@HOTMAIL.COM +23,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,02-Sep-20,HAILEY_LEE,F,20-Dec-13,BANDERALO,SEXTONREGINALD@HOTMAIL.COM +24,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,02-Sep-20,MELISSA_LARSON,F,04-May-03,VILLA_MANZANO,BRYANTSHELBY@HOTMAIL.COM +25,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,02-Sep-20,TIFFANY_FIELDS,F,12-Jun-77,EL_PINO,FRENCHBRIAN@HOTMAIL.COM 
+26,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,02-Sep-20,TRACY_CRAWFORD,F,17-May-14,ARROYO_PAREJA,JOSEJACKSON@HOTMAIL.COM +27,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,03-Sep-20,JOANN_HOWELL,F,28-Mar-58,AGUSTONI,WONGCALEB@YAHOO.COM +28,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,03-Sep-20,LAUREN_FREDERICK,F,19-Apr-24,CARI_LARQUEA,COLTON79@YAHOO.COM +29,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,03-Sep-20,SANDRA_ARROYO,F,24-Mar-16,GENERAL_RODRIGUEZ,XJOHNSON@GMAIL.COM +30,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,03-Sep-20,CAROLINE_JAMES,F,31-May-64,ANDRADE,PHILLIPSSHIRLEY@HOTMAIL.COM +31,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,03-Sep-20,CHRISTINA_WILKINSON,F,07-Dec-39,12_DE_OCTUBRE,DUNLAPMARCUS@GMAIL.COM +32,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,03-Sep-20,AMY_SMITH,F,29-Oct-28,ACASSUSO,MARTINEZMICHAEL@HOTMAIL.COM +33,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,03-Sep-20,NICOLE_BRYAN,F,08-May-11,ISLA_VICTORIA,MMILLER@GMAIL.COM +34,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,03-Sep-20,CHRISTOPHER_JOHNSON,M,16-Mar-79,ESMERALDA,CONWAYWILLIAM@GMAIL.COM +35,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,03-Sep-20,KRISTEN_MICHAEL,F,23-May-48,EL_ARAZA,ROBERTNGUYEN@YAHOO.COM +36,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,03-Sep-20,MICHAEL_COLE,M,10-Jun-14,ARROYO_CORTO,THOMPSONJAMES@HOTMAIL.COM +37,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,03-Sep-20,ADRIAN_NGUYEN,M,14-Mar-15,ACERILLOS,EMILY62@GMAIL.COM +38,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,03-Sep-20,JAMES_ESPARZA,M,13-Jul-35,ARROYO_TOMAS,BENJAMIN89@HOTMAIL.COM +39,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,03-Sep-20,STEVEN_ROBINSON,M,22-Jun-11,ASERRADERO_ARROYO,IPHILLIPS@YAHOO.COM +40,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,04-Sep-20,JOYCE_FAULKNER,F,12-Mar-04,ARANA,MOORECHRISTOPHER@GMAIL.COM 
+41,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,04-Sep-20,DAWN_FLORES,F,10-Dec-11,EL_RETIRO,DEBBIE46@YAHOO.COM +42,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,04-Sep-20,KEVIN_KIM,M,30-Jun-25,ENCINA,MIRANDA39@YAHOO.COM +43,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,04-Sep-20,ERIC_FOSTER,M,21-Feb-38,LA_ROSA,CAROLYNREYES@HOTMAIL.COM +44,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,04-Sep-20,SHAUN_HARRIS,M,24-Jan-72,BIGAND,SMITHSTEPHANIE@GMAIL.COM +45,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,04-Sep-20,JONATHAN_MCCARTHY,M,27-Sep-12,EL_CAMOATI,SARAHMOONEY@HOTMAIL.COM +46,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,04-Sep-20,PAMELA_WILLIAMS,F,24-Jan-12,ADAN_QUIROGA,STEVENSONJACOB@YAHOO.COM +47,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,04-Sep-20,MICHAEL_BROWN,M,09-Oct-88,LLAVALLOL,DERRICK97@YAHOO.COM +48,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,04-Sep-20,MEGAN_SCHWARTZ,F,09-Sep-26,COLONIA_EL_POTRERO,SWANSONGREGORY@YAHOO.COM +49,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,04-Sep-20,KAREN_WILLIAMS,F,27-Jan-08,COLONIA_HERNANDARIAS,TERESA05@HOTMAIL.COM +50,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,04-Sep-20,JENNIFER_GREGORY_PHD,F,09-Oct-15,CUENCA,JOHNSONDENNIS@GMAIL.COM +51,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,04-Sep-20,JESSICA_BROWN,F,13-Jun-93,ARROYO_CASCO,RYANPORTER@GMAIL.COM +52,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,04-Sep-20,BRENDA_HURST,F,24-Aug-35,VILLANI,JUSTIN13@YAHOO.COM +53,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,04-Sep-20,STACEY_MEYER,F,23-Sep-79,LA_SARA,GANTHONY@YAHOO.COM +54,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,05-Sep-20,SAMUEL_PARKER,M,15-Jul-38,EL_TREBOL,QSIMS@GMAIL.COM +55,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,05-Sep-20,MASON_CARPENTER,M,22-Aug-34,AGUA_LINDA,PAUL92@GMAIL.COM 
+56,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,05-Sep-20,THOMAS_GILLESPIE,M,04-Jan-05,BAJO_GUAZU,GCRAWFORD@HOTMAIL.COM +57,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,05-Sep-20,KENNETH_SMITH,M,24-Dec-55,ALGARROBAL,MARVINFULLER@GMAIL.COM +58,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,05-Sep-20,MICHAEL_KELLY,M,18-Aug-25,RECALDE,HARRISJEREMY@YAHOO.COM +59,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,05-Sep-20,CAROLINE_MOORE,F,08-Apr-06,BARRIO_JARDIN_LUZURIAGA,JASONTHOMAS@HOTMAIL.COM +60,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,05-Sep-20,JAMES_BRADLEY,M,19-Dec-77,BOLIVAR,PORTERDANIELLE@HOTMAIL.COM +61,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,05-Sep-20,JASON_SWANSON,M,18-Dec-16,ESTACION_CORONEL_PRINGLES,CHRISTINE98@HOTMAIL.COM +62,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,05-Sep-20,RICHARD_VASQUEZ,M,05-Feb-17,ABRA_DEL_TAFI,DAVIDCOURTNEY@YAHOO.COM +63,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,05-Sep-20,LINDSEY_GREEN,F,20-Jan-20,VILLA_HIPODROMO,LROSALES@GMAIL.COM +64,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,05-Sep-20,TREVOR_JACKSON,M,23-Aug-25,CHACRAS_VIEJAS,ANGELA25@GMAIL.COM +65,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,05-Sep-20,ALLISON_ESTRADA,F,16-May-93,HALE,KELLY47@HOTMAIL.COM +66,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,06-Sep-20,SAMANTHA_HINTON,F,26-Apr-42,COLONIA_EL_AGUARA,KLEINCHRISTINA@HOTMAIL.COM +67,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,06-Sep-20,SAMUEL_WALLACE,M,24-Aug-14,CAMPO_CASTRO,OFERNANDEZ@YAHOO.COM +68,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,06-Sep-20,STACY_WEBB,F,20-Nov-29,CARACOLES,BRIANLEWIS@HOTMAIL.COM +69,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,06-Sep-20,DONNA_LANE,F,31-Jul-43,BERABEVU,GTHOMPSON@GMAIL.COM +70,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,06-Sep-20,RYAN_GARZA,M,12-Apr-56,COLONIA_LOS_TRES_USARIS,MICHAEL47@YAHOO.COM 
+71,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,06-Sep-20,KIMBERLY_CARDENAS,F,22-May-11,EL_GUALICHO,XCOPELAND@YAHOO.COM +72,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,06-Sep-20,JACQUELINE_ADAMS,F,06-Jan-93,ASAMBLEA,DOUGLASROMERO@HOTMAIL.COM +73,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,06-Sep-20,KAREN_WILSON,F,09-Mar-27,ESTEBAN_DE_LUCA,KRISTINE32@GMAIL.COM +74,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,06-Sep-20,SHARON_DONALDSON,F,16-Aug-81,ADELA,SCASTILLO@HOTMAIL.COM +75,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,06-Sep-20,STEVEN_ROMERO,M,30-Jun-56,LIBANO,ANDERSONDEBRA@YAHOO.COM +76,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,06-Sep-20,LISA_SWANSON,F,02-Mar-09,LA_BUANA_MOZA,MRIVERA@GMAIL.COM +77,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,06-Sep-20,JENNA_WILSON,F,17-Jan-60,CATARATAS_DEL_IGUAZU,SARAHHARRIS@HOTMAIL.COM +78,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,06-Sep-20,MATTHEW_GRIFFIN,M,02-Jun-64,BUSTAMANTE,DIAZERIC@YAHOO.COM +79,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,07-Sep-20,JOSEPH_MEADOWS,M,14-Oct-31,EZPELETA_ESTE,SARA20@GMAIL.COM +80,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,07-Sep-20,STEPHANIE_HART,F,21-Sep-42,ARISTIDES_VILLANUEVA,PATELSAMUEL@YAHOO.COM +81,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,07-Sep-20,JAMES_ROBINSON,M,14-Oct-02,ARANGUREN,ROBINSONPAMELA@YAHOO.COM +82,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,07-Sep-20,CAROLYN_WATSON,F,02-May-58,SAN_ANDRES,GRIFFINMATTHEW@HOTMAIL.COM +83,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,07-Sep-20,RALPH_JONES,M,21-Oct-05,CAPDEPONT,HENSONTRACY@YAHOO.COM +84,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,07-Sep-20,JOHN_KING,M,04-Feb-46,KILOMETRO_125,RICHARDMARTINEZ@HOTMAIL.COM +85,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,07-Sep-20,JULIE_GARCIA,F,16-Jan-13,CORTINES,BASSERIK@GMAIL.COM 
+86,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,07-Sep-20,THOMAS_WOOD,M,14-Jan-81,CERRILLOS_AL_SUD,CYNTHIAWOLF@HOTMAIL.COM +87,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,07-Sep-20,THOMAS_FLORES,M,03-Dec-18,COLONIA_EL_SIMBOL,RPHILLIPS@GMAIL.COM +88,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,07-Sep-20,CARLOS_RICHARDS,M,09-Jun-87,ARRIBEÑOS,BRITTANY00@GMAIL.COM +89,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,07-Sep-20,KEVIN_FREEMAN,M,14-Jul-24,LA_PORTEÑA,MONICAMAYO@HOTMAIL.COM +90,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,08-Sep-20,ROBERT_CLARK,M,29-Nov-01,LA_FLORENCIA,ANTHONY05@HOTMAIL.COM +91,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,08-Sep-20,TRACY_CASTILLO_MD,M,07-Apr-56,3_DE_MAYO,JAMESANDRADE@GMAIL.COM +92,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,08-Sep-20,SHARON_SHEPARD,F,23-Sep-10,VILLARS,TAYLORJAMES@YAHOO.COM +93,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,08-Sep-20,CHERYL_SCHROEDER,F,26-Nov-54,CAPILLA_DEL_SEÑOR,EMACDONALD@YAHOO.COM +94,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,08-Sep-20,JESSE_BALDWIN,M,21-Oct-57,COLONIA_ZAPATA,SNYDERBRIAN@HOTMAIL.COM +95,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,08-Sep-20,OLIVIA_PETERSON,F,07-Feb-16,CAMPO_MONTE_LA_VIRUELA,BRIANARILEY@HOTMAIL.COM +96,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,08-Sep-20,ALAN_ONEILL,M,12-Dec-68,AERO_CLUB_ROSARIO,EGLOVER@HOTMAIL.COM +97,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,08-Sep-20,TAYLOR_BURNS,M,01-May-04,ALTAMIRANO,MIGUELWHITE@HOTMAIL.COM +98,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,08-Sep-20,XAVIER_MILLER,M,25-Mar-85,20_DE_SEPTIEMBRE,JEREMYRHODES@YAHOO.COM +99,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,09-Sep-20,RACHEL_GAMBLE,F,17-Sep-84,ATREUCO,REGINAFRANKLIN@HOTMAIL.COM +100,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,09-Sep-20,SEAN_MOORE,M,20-Oct-60,VILLARS,THOMASOLIVIA@YAHOO.COM 
+101,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,09-Sep-20,THOMAS_DAY,M,07-Nov-48,BAIGORRITA,MAXWILLIAMS@GMAIL.COM +102,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,09-Sep-20,BRANDI_PATTERSON,F,02-Jul-49,ARAÑITA,PATRICKWRIGHT@HOTMAIL.COM +103,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,09-Sep-20,GREGORY_JOHNSON,M,22-May-68,PAGANCILLO,CARRIEJOHNSON@GMAIL.COM +104,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,09-Sep-20,JONATHAN_JONES,M,13-Jun-17,BALDES_DE_PACHECO,WALTERCOMBS@YAHOO.COM +105,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,09-Sep-20,KIMBERLY_GONZALEZ,F,24-Jun-92,AVESTRUZ,SCHMIDTMARIA@HOTMAIL.COM +106,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,09-Sep-20,TODD_TUCKER,M,17-Jun-46,AGUA_DE_DIONISIO,MICHAEL85@HOTMAIL.COM +107,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,09-Sep-20,TIMOTHY_THOMAS,M,04-Jul-75,IFRAN,AFISHER@HOTMAIL.COM +108,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,09-Sep-20,ADAM_BROWN,M,23-Feb-05,ALTO_DE_LA_LEÑA,UMYERS@YAHOO.COM +109,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,09-Sep-20,RICKY_MEYER,M,08-Feb-63,COMANDANTE_GIRIBONE,GORDON94@HOTMAIL.COM +110,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,09-Sep-20,MELISSA_WALKER,F,18-Apr-30,SAN_GENARO_NORTE,MWARD@GMAIL.COM +111,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,09-Sep-20,DEBRA_FOWLER,F,08-Jun-31,ALAMO,AARONSMITH@HOTMAIL.COM +112,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,09-Sep-20,MITCHELL_ELLISON,M,25-Feb-22,CARAGUATAY,FGIBSON@HOTMAIL.COM +113,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,09-Sep-20,HEATHER_WASHINGTON,F,03-Oct-32,CABI_MONDA,CAMPBELLJAMES@HOTMAIL.COM +114,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,09-Sep-20,SHEILA_WONG,F,23-Mar-86,20_DE_SEPTIEMBRE,SMARTIN@GMAIL.COM +115,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,09-Sep-20,ANNA_MARTINEZ,F,21-Nov-60,ARROYO_ISABEL,LDUNN@GMAIL.COM 
+116,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,09-Sep-20,KATHERINE_MEDINA,F,17-Sep-26,CAMPO_CASTRO,REGINALD04@HOTMAIL.COM +117,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,10-Sep-20,LATASHA_SMITH,F,16-Dec-56,DON_TORCUATO,BRETT19@HOTMAIL.COM +118,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,10-Sep-20,ERICA_BAILEY,F,23-Oct-11,CONCEPCION_DEL_BERMEJO,TAMI08@HOTMAIL.COM +119,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,10-Sep-20,JOSHUA_PALMER,M,07-Jan-87,LA_PORTEÑA,MARK21@HOTMAIL.COM +120,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,10-Sep-20,JOHN_ONEAL,M,06-Feb-13,BATIRUANA,JOHN08@GMAIL.COM +121,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,10-Sep-20,JESSICA_WILLIAMS,F,16-Oct-08,BOUQUET,WAGNERMARIA@YAHOO.COM +122,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,10-Sep-20,JONATHAN_KENNEDY,M,20-Dec-33,ABRALAITE,JAMESJACKSON@HOTMAIL.COM +123,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,10-Sep-20,JONATHAN_LAM,M,06-Aug-28,BOCAS,LATOYAGOULD@GMAIL.COM +124,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,10-Sep-20,TAMMY_SANCHEZ,F,27-Apr-86,SIERRA_DE_LA_VENTANA,SAMANTHAGIBSON@HOTMAIL.COM +125,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,10-Sep-20,JUSTIN_WARD,M,15-Aug-51,CASCADA,HEATHER47@YAHOO.COM +126,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,10-Sep-20,JANET_JENKINS,F,21-Jul-12,BARRANCAS_COLORADAS,PATRICK54@GMAIL.COM +127,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,10-Sep-20,CHRISTINE_CONNER_MD,F,25-Jul-36,CAÑADA_SECA,JUSTINBROWN@YAHOO.COM +128,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,10-Sep-20,RONALD_KENNEDY,M,28-Apr-06,MORON,KHANLISA@GMAIL.COM +129,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,11-Sep-20,VERONICA_WHITE,F,10-Nov-08,ALTONA,HENDERSONMEGAN@HOTMAIL.COM +130,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,11-Sep-20,ANA_GRAVES,F,26-Aug-12,BAJO_GUAZU,ROSALESCLAUDIA@GMAIL.COM +131,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,11-Sep-20,MICHAEL_SCOTT,M,11-Sep-01,BENITO_JUAREZ,WILLIAMSONSARAH@YAHOO.COM 
+132,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,11-Sep-20,BRYCE_NAVARRO,M,02-Apr-70,ASCENCION,BROWNSYDNEY@HOTMAIL.COM +133,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,11-Sep-20,TAYLOR_WILLIAMS,M,13-May-60,CUARTEL_V,NWALLS@HOTMAIL.COM +134,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,11-Sep-20,ANGEL_MOSLEY,F,31-Oct-24,CAÑADA_DE_LAS_VACAS,ANDREWMARTIN@YAHOO.COM +135,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,11-Sep-20,WILLIE_SOLIS,M,04-Mar-19,ESC_NAV_MILITAR_RIO_SANT,AARON89@HOTMAIL.COM +136,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,11-Sep-20,DAVID_THOMPSON,M,14-Aug-04,ALEGRIA,BRIANSTANTON@HOTMAIL.COM +137,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,11-Sep-20,JIM_COX,M,20-Jun-71,CAA_YARI,OLIVEREVELYN@YAHOO.COM +138,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,11-Sep-20,DIANE_WARREN,F,24-Oct-09,CABURE,HEDWARDS@YAHOO.COM +139,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,11-Sep-20,JULIE_THOMPSON,F,06-Apr-92,EL_REMANSO,THOMAS62@GMAIL.COM +140,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,12-Sep-20,KRISTOPHER_WILKINS,M,09-Sep-58,CARRIZAL_NORTE,HUGHESRACHEL@YAHOO.COM +141,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,12-Sep-20,TINA_HILL,F,20-Feb-32,BARRIO_1_DE_MAYO,WILLIAMSONWILLIAM@YAHOO.COM +142,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,12-Sep-20,ELIZABETH_FLETCHER,F,16-Apr-28,COLONIA_MABRAGAÑA,RCLARK@YAHOO.COM +143,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,12-Sep-20,MIGUEL_WILLIAMS,M,01-Aug-83,INGENIO_LA_PROVIDENCIA,CCARTER@YAHOO.COM +144,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,12-Sep-20,MATTHEW_CONLEY,M,08-Oct-42,EL_ARAZA,WATSONMELISSA@HOTMAIL.COM +145,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,12-Sep-20,STEVEN_BOWMAN,M,24-Feb-49,ACONQUIJA,YKIM@GMAIL.COM +146,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,12-Sep-20,GEORGE_WASHINGTON,M,06-Apr-65,MECHA,TTAYLOR@YAHOO.COM 
+147,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,12-Sep-20,NATASHA_EDWARDS,F,02-Apr-77,ARROYO_LAS_MINAS,ADAMRAMIREZ@GMAIL.COM +148,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,13-Sep-20,MARCUS_PAYNE,M,11-Dec-15,APEADERO_LAS_CHIMBAS,ERICSULLIVAN@YAHOO.COM +149,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,13-Sep-20,YOLANDA_HARRIS,F,30-Jun-34,ALEJANDRA,BRENDAHODGES@YAHOO.COM +150,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,13-Sep-20,APRIL_JOYCE,F,05-Nov-35,CHOVET,SANDRA83@YAHOO.COM +151,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,13-Sep-20,JESSICA_VEGA,F,15-Feb-49,LUIS_CHICO,VWASHINGTON@HOTMAIL.COM +152,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,13-Sep-20,JASON_SHEA,M,01-Jun-42,ARROYO_HONDO,RONALDDEAN@GMAIL.COM +153,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,13-Sep-20,FRANK_WEAVER,M,18-Apr-06,INGENIERO_BALBIN,VICKIEWOOD@YAHOO.COM +154,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,13-Sep-20,MICHELE_TUCKER,F,11-Dec-98,BALDES_DE_PACHECO,ADAVIS@YAHOO.COM +155,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,14-Sep-20,ANDREW_LE,M,03-Sep-67,ARAÑITA,DOROTHY42@YAHOO.COM +156,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,14-Sep-20,JACOB_GOODWIN,M,09-May-96,COSTA_BONITA_BALNEARIO,TIMOTHY92@GMAIL.COM +157,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,14-Sep-20,MICHAEL_MUNOZ,M,29-Mar-68,ACHALCO,WHITNEY22@YAHOO.COM +158,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,14-Sep-20,KIMBERLY_FLOYD,F,03-Aug-16,ALBARDON,PAULBURCH@GMAIL.COM +159,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,14-Sep-20,TERRI_ONEAL,F,07-Jul-11,KILOMETRO_47,WANDAMILLER@GMAIL.COM +160,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,14-Sep-20,JULIE_MURRAY,F,08-Jun-22,INGENIERO_WILLIAMS,SWILSON@YAHOO.COM +161,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,14-Sep-20,NICHOLAS_ALVAREZ,M,07-Jul-43,COLONIA_GOBERNADOR_AYALA,SARAH42@YAHOO.COM 
+162,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,14-Sep-20,COLLIN_STEWART,M,09-Dec-08,POZO_NAVAGAN,CASSIEJOHNSON@GMAIL.COM +163,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,14-Sep-20,WILLIAM_BELL,M,16-Aug-75,JUAN_VELA,NICOLE13@HOTMAIL.COM +164,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,14-Sep-20,CHARLES_HAYDEN,M,16-Nov-66,ALEGRIA,JODY40@YAHOO.COM +165,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,14-Sep-20,TIFFANY_BROWN,F,01-Oct-03,16_DE_JULIO,CHARLESJAMES@GMAIL.COM +166,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,14-Sep-20,JOHN_WELLS,M,03-Jan-64,BUEN_PASTO,JASON46@GMAIL.COM +167,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,15-Sep-20,HEATHER_THOMAS,F,20-Mar-13,AGUAS_CALIENTES,JOSEPHCOLEMAN@YAHOO.COM +168,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,15-Sep-20,ERICA_PEREZ,F,27-Oct-82,EMPALME,HRICHARDSON@HOTMAIL.COM +169,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,15-Sep-20,PETER_DUNN,M,26-Mar-86,LOS_MOLINOS,NGARRETT@YAHOO.COM +170,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,15-Sep-20,BECKY_MCKEE,F,28-Mar-97,ARMSTRONG,ANTHONYLOPEZ@HOTMAIL.COM +171,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,15-Sep-20,TIMOTHY_BROWN,M,21-Sep-52,BARRANQUERAS,LOGAN69@GMAIL.COM +172,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,15-Sep-20,KIM_CARTER,F,12-Mar-20,CARLOS_PELLEGRINI,JOSEPHGILL@HOTMAIL.COM +173,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,15-Sep-20,JASON_FISHER,M,27-Mar-07,BAJO_LAS_TUNAS,STOUTLARRY@HOTMAIL.COM +174,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,15-Sep-20,LAURA_MAHONEY,F,21-May-48,ARROYO_DULCE,YBRAUN@YAHOO.COM +175,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,15-Sep-20,ANDREW_OSBORNE,M,12-Feb-89,ATALIVA,HMCCLAIN@YAHOO.COM +176,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,15-Sep-20,CHRISTOPHER_BASS,M,29-Sep-84,COPACABANA,JERRYHESS@YAHOO.COM 
+177,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,15-Sep-20,RENEE_COX,F,26-Aug-21,ANTONIO_TOMAS,RBAKER@HOTMAIL.COM +178,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,15-Sep-20,ANNA_CLARK,F,17-Dec-49,LA_FLORENCIA,SMITHBRIAN@GMAIL.COM +179,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,15-Sep-20,PENNY_HUANG,F,23-Nov-88,CAMPO_SALUSSO,ROBERT89@HOTMAIL.COM +180,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,15-Sep-20,SYDNEY_ENGLISH,F,25-Feb-48,ESMERALDA,JERRYARMSTRONG@YAHOO.COM +181,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,15-Sep-20,ROBERT_JOHNSON,M,01-Jun-74,JUAN_VELA,BROWNJANE@YAHOO.COM +182,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,15-Sep-20,JAMES_SINGH,M,20-Dec-17,ALASTUEY,PCOOPER@GMAIL.COM +183,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,15-Sep-20,BRANDON_THOMPSON,M,26-Mar-38,AGUA_DE_LOS_MANANTIALES,FARROYO@HOTMAIL.COM +184,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,16-Sep-20,KATHERINE_BAKER,F,27-Dec-19,PASO_TELEGRAFO,ANGELASMITH@GMAIL.COM +185,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,16-Sep-20,REBECCA_JOHNSON_MD,F,11-Oct-68,FRANCISCO_CASAL,JENNA90@YAHOO.COM +186,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,16-Sep-20,JACOB_NORRIS,M,26-Jan-62,BELLOCQ,NICOLENELSON@YAHOO.COM +187,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,16-Sep-20,YVONNE_FISHER,F,20-Sep-43,BOQUERON,PARKERANDREW@YAHOO.COM +188,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,16-Sep-20,KIM_TAYLOR,F,30-Aug-81,COLONIA_JOSEFA,TRACIROMERO@GMAIL.COM +189,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,16-Sep-20,JACQUELINE_HERNANDEZ,F,19-Aug-19,ARROYO_MAGDALENA,DANNYMARTIN@YAHOO.COM +190,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,16-Sep-20,JOHN_OLIVER,M,28-Nov-96,FRANCISCO_MADERO,KEVINPEREZ@HOTMAIL.COM +191,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,16-Sep-20,GLORIA_COOPER,F,21-Feb-08,LA_COLINA,HANDERSON@GMAIL.COM 
+192,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,16-Sep-20,CHRISTINA_PARSONS,F,22-Jan-50,VILLA_ANGELICA,PAMELALAWSON@YAHOO.COM +193,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,16-Sep-20,DUSTIN_BURTON,M,24-Jan-14,CAMINERA_LUJAN,ELIZABETH75@GMAIL.COM +194,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,16-Sep-20,TAMMY_BRYANT,F,28-Nov-69,GENTE_GRANDE,BRADSHAWCOURTNEY@GMAIL.COM +195,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,16-Sep-20,JAMES_BARRETT,M,19-Jun-41,AGUA_DEL_SIMBOL,HOGANKARL@HOTMAIL.COM +196,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,16-Sep-20,MICHAEL_MEYER,M,19-Mar-67,MARTIN_CORONADO,ALYSSASTAFFORD@YAHOO.COM +197,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,16-Sep-20,JENNIFER_COLLINS,F,08-Aug-11,COLONIA_FALCO,WMORROW@HOTMAIL.COM +198,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,17-Sep-20,ANTHONY_MILLER,M,27-Jun-83,12_DE_OCTUBRE,EJENNINGS@YAHOO.COM +199,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,17-Sep-20,JENNIFER_JIMENEZ,F,21-Nov-95,CORA,TBAILEY@YAHOO.COM +200,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,17-Sep-20,NICHOLAS_CASE,M,22-Jul-67,LA_DULCE,XNORRIS@GMAIL.COM +201,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,17-Sep-20,SAMUEL_BROOKS,M,18-Oct-87,TEMPERLEY,HANNAHWILLIAMS@GMAIL.COM +202,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,17-Sep-20,LORI_ROBERTS,F,14-Jan-02,INDACOCHEA,MURRAYDORIS@HOTMAIL.COM +203,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,17-Sep-20,JOSHUA_FRIEDMAN,M,11-Jan-69,JOSE_CLEMENTE_PAZ,VSMITH@HOTMAIL.COM +204,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,17-Sep-20,DAVID_EVANS,M,13-Jul-70,LOS_ANTIGUOS,DAVIDFLORES@YAHOO.COM +205,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,17-Sep-20,JESSICA_GREEN,F,12-Aug-10,ASTURIAS,HCRAWFORD@YAHOO.COM +206,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,17-Sep-20,GABRIELA_WEISS,F,04-Nov-93,NORDELTA,STONECATHERINE@YAHOO.COM 
+207,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,17-Sep-20,JAMES_GONZALEZ,M,08-Mar-42,CORONEL_ISLEÑOS,JOSEPHJACKSON@HOTMAIL.COM +208,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,17-Sep-20,TAYLOR_SAUNDERS,F,13-Nov-61,FORTIN_IRENE,AMANDA64@YAHOO.COM +209,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,17-Sep-20,RAYMOND_WILKINSON,M,04-Nov-55,ALDEA_SAN_ANDRES,CHRISTOPHER41@HOTMAIL.COM +210,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,17-Sep-20,BRANDON_KELLER,M,23-Nov-81,COLONIA_NUEVA_MONTEVIDEO,MASONMATTHEW@GMAIL.COM +211,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,17-Sep-20,KATHY_SOTO,F,30-Jan-39,COLONIA_BARON_HIRSCH,RANDALLROGERS@YAHOO.COM +212,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,17-Sep-20,ANDREA_JACKSON,F,13-Feb-99,ARROYO_DEL_CURA,ROBERTSJOSE@HOTMAIL.COM +213,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,18-Sep-20,TRISTAN_GONZALES,M,10-Dec-73,RICARDO_LAVALLE,NATASHARODRIGUEZ@GMAIL.COM +214,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,18-Sep-20,EARL_MARTINEZ,M,14-Feb-11,ABRA_RICA,WILLIAM80@HOTMAIL.COM +215,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,18-Sep-20,BRENDA_BENSON,F,12-Oct-19,DOLORES,JEFF02@GMAIL.COM +216,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,18-Sep-20,BREANNA_WELLS,F,29-Jan-56,25_DE_MAYO,JOSEPHTHOMPSON@YAHOO.COM +217,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,18-Sep-20,MICHELLE_EVANS,F,29-Mar-14,25_DE_MAYO,PHUGHES@HOTMAIL.COM +218,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,18-Sep-20,JUSTIN_MILLER,M,31-Dec-85,BIGAND,MOLINAJAMES@HOTMAIL.COM +219,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,18-Sep-20,DAVID_MICHAEL,M,15-Jan-60,LIBANO,FOSTERJAMES@GMAIL.COM +220,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,18-Sep-20,TANYA_MAYNARD,F,29-Jun-69,CHAVARRIA,WHITEJOEL@YAHOO.COM +221,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,18-Sep-20,STANLEY_THOMAS,M,14-Apr-06,ALGARROBO,SANCHEZNICHOLAS@YAHOO.COM 
+222,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,18-Sep-20,JACQUELINE_LYNCH,F,05-Feb-54,BIGAND,KEITH17@GMAIL.COM +223,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,18-Sep-20,LORI_SANCHEZ,F,03-Oct-24,ACEILAN,GBROWN@GMAIL.COM +224,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,18-Sep-20,GREGORY_PATEL,M,21-Mar-49,EL_CHALTEN,ROBERTMATTHEWS@YAHOO.COM +225,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,18-Sep-20,WILLIAM_ROLLINS,M,03-Jun-80,ANTIGUYOS,ARIASPATRICIA@HOTMAIL.COM +226,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,18-Sep-20,MELISSA_CHRISTIAN,F,12-Feb-55,ALMACEN_CASTRO,SMITHJEFFREY@HOTMAIL.COM +227,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,18-Sep-20,JEREMIAH_HERNANDEZ,M,15-Dec-92,INDIO_RICO,WILLIAM27@GMAIL.COM +228,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,18-Sep-20,DEBRA_ZHANG,F,16-Oct-84,AGUA_DE_LA_MULA,JENNIFER21@YAHOO.COM +229,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,18-Sep-20,HEATHER_DAVIDSON,F,08-Jul-05,AGRELO,THUANG@YAHOO.COM +230,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,19-Sep-20,RICHARD_REESE,M,10-Dec-71,AGUADITAS,SAWYERKIMBERLY@HOTMAIL.COM +231,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,19-Sep-20,JOSE_JACKSON,M,13-Mar-82,AGRELO,MIGUELMORGAN@YAHOO.COM +232,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,19-Sep-20,MELISSA_RODRIGUEZ,F,02-Nov-17,CACHIYUYAL,DARLENEHENRY@GMAIL.COM +233,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,19-Sep-20,SARAH_GALLAGHER,F,26-Aug-14,AYUI_PARADA,EDWARDHENDRICKS@HOTMAIL.COM +234,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,19-Sep-20,JAMES_THOMAS,M,11-Apr-46,SAN_JOSE,LYNCHSCOTT@YAHOO.COM +235,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,19-Sep-20,MATTHEW_BASS,M,07-Nov-60,DIEGO_LOPEZ,JEFFREYMANNING@YAHOO.COM +236,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,19-Sep-20,JAMES_CARTER,M,18-Dec-92,AYACUCHO,PVALDEZ@HOTMAIL.COM 
+237,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,19-Sep-20,STEPHANIE_HAYS,F,13-Oct-29,RAFAEL_CASTILLO,SAWYERROBIN@HOTMAIL.COM +238,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,19-Sep-20,MICHAEL_PETERSON,M,14-May-18,BANDERALO,ANDREWBARTON@YAHOO.COM +239,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,19-Sep-20,TARA_POWELL,F,13-Jul-38,GANDOLFI,CHELSEA78@HOTMAIL.COM +240,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,20-Sep-20,GEOFFREY_SHEA,M,13-Jan-90,BARROS_PAZOS,MILLERMONICA@GMAIL.COM +241,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,20-Sep-20,ERIK_PATTERSON,M,16-Nov-05,BOQUERON,FISHERPHILLIP@HOTMAIL.COM +242,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,20-Sep-20,JAMES_SHIELDS,M,24-Mar-49,LOS_INDIOS,NPROCTOR@HOTMAIL.COM +243,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,20-Sep-20,MARK_SHAW,M,14-Sep-08,COLONIA_JAPONESA,ERIN47@YAHOO.COM +244,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,20-Sep-20,JORGE_GOMEZ,M,06-May-29,ESTACION_USPALLATA,BARBARAMARTINEZ@HOTMAIL.COM +245,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,20-Sep-20,JOSEPH_FRANKLIN,M,20-Jan-72,AERO_CLUB_ROSARIO,MICHELLEPRESTON@YAHOO.COM +246,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,20-Sep-20,JUSTIN_PACHECO,M,24-Jun-79,ALBARRACIN,WILSONJENNIFER@GMAIL.COM +247,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,20-Sep-20,SHAWNA_WATKINS,F,12-Mar-80,BONPLAND,JESSESTEVENSON@HOTMAIL.COM +248,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,20-Sep-20,CHRISTOPHER_GARCIA,M,12-Aug-23,COLONIA_JAUREGUI,DONNA62@YAHOO.COM +249,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,20-Sep-20,ELIZABETH_MORENO,F,28-Jun-06,AGUA_DE_LA_ZORRA,TAYLORLORI@YAHOO.COM +250,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,20-Sep-20,MICHAEL_VASQUEZ,M,08-Apr-11,ALIJILAN,JAMESRAY@YAHOO.COM +251,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,20-Sep-20,JAMES_CAMPBELL,M,08-Jul-56,LA_PLATA,NBURCH@GMAIL.COM 
+252,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,20-Sep-20,DEBORAH_REID,F,11-Jul-35,COLIQUEO,XGRIFFIN@GMAIL.COM +253,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,20-Sep-20,MICHAEL_GRIFFIN,M,12-Sep-93,CARI_LARQUEA,SBRADY@HOTMAIL.COM +254,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,20-Sep-20,JOHN_JOHNSON,M,15-Jan-19,COLONIA_FREITAS,BTAYLOR@YAHOO.COM +255,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,20-Sep-20,EDWIN_JACKSON,M,11-Oct-05,CENTINELA,ANDERSONNATALIE@HOTMAIL.COM +256,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,20-Sep-20,DR._KATHRYN_TURNER,F,16-Nov-84,AGUADA_A_PIQUE,DVILLEGAS@YAHOO.COM +257,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,20-Sep-20,JENNIFER_HAWKINS,F,13-May-94,TEMPERLEY,MARY45@GMAIL.COM +258,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,20-Sep-20,KELLY_TAYLOR,F,14-Dec-94,MANUEL_OCAMPO,RANDALLWEBER@GMAIL.COM +259,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,20-Sep-20,MALLORY_VILLARREAL,F,26-Jan-81,AGUARA_CUA,PORTERDAVE@YAHOO.COM +260,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,21-Sep-20,BRIAN_MORRISON,M,25-Nov-43,ALTO_DE_LA_LEÑA,PATRICK64@GMAIL.COM +261,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,21-Sep-20,ELIZABETH_NAVARRO,F,02-Nov-78,COLONIA_AROCENA_INA,DWEST@HOTMAIL.COM +262,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,21-Sep-20,ELIJAH_ONEILL,M,17-Apr-46,12_DE_OCTUBRE,LOGANROBERTSON@GMAIL.COM +263,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,21-Sep-20,JASON_JOHNSON,M,26-Dec-69,LEUBUCO,STEVEN06@GMAIL.COM +264,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,21-Sep-20,NICOLE_TYLER,F,01-Dec-24,BENAVIDEZ,AMYCONTRERAS@GMAIL.COM +265,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,21-Sep-20,CHEYENNE_SOLOMON,F,27-Nov-08,MARIA_MAGDALENA,ZRAMIREZ@GMAIL.COM +266,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,21-Sep-20,HECTOR_SHERMAN,M,14-Jun-43,COLONIA_JAPONESA,EBAILEY@YAHOO.COM 
+267,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,21-Sep-20,JAMES_HARVEY_DDS,M,28-Jan-50,BAIGORRITA,FERGUSONBRANDON@HOTMAIL.COM +268,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,21-Sep-20,KIMBERLY_LANE,F,07-Apr-45,CEVIL_GRANDE,DICKERSONJAMES@HOTMAIL.COM +269,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,21-Sep-20,JESSICA_ADAMS,F,16-Sep-39,AGUA_DE_DIONISIO,ERICMONROE@HOTMAIL.COM +270,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,21-Sep-20,MARIA_EVANS,F,05-Nov-89,LA_CALIFORNIA,JENNIFER35@HOTMAIL.COM +271,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,22-Sep-20,MICHELLE_WALSH,F,22-Sep-73,ARROYO_CORTO,JESSICANEWMAN@HOTMAIL.COM +272,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,22-Sep-20,RUSSELL_ROBERTS,M,11-Dec-16,ALTO_LINDO,DEBRA58@GMAIL.COM +273,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,22-Sep-20,SHERRI_THOMAS,F,24-Jan-11,CORRALITO,MARKLYNCH@GMAIL.COM +274,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,22-Sep-20,JESSICA_JAMES,F,11-Nov-15,CARCARAÑA,VINCENTJOEL@YAHOO.COM +275,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,22-Sep-20,KRISTIN_BAXTER,F,12-Feb-83,CASABLANCA,QHANSON@GMAIL.COM +276,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,23-Sep-20,ELIJAH_MURPHY,M,29-Sep-63,ARROYO_URQUIZA,DMILLER@HOTMAIL.COM +277,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,23-Sep-20,MICHAEL_WILLIAMS,M,10-May-96,16_DE_JULIO,IHICKMAN@GMAIL.COM +278,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,23-Sep-20,JOHN_OWENS,M,18-Sep-20,CAMPO_DE_LOS_ANDES,ECHRISTIAN@HOTMAIL.COM +279,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,23-Sep-20,BETHANY_MCCALL,F,27-Dec-88,AGUA_AMARGA,HOWARDDENISE@YAHOO.COM +280,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,23-Sep-20,BENJAMIN_PARKER,M,12-Apr-53,GOBERNADOR_MOYANO,DOMINGUEZKRISTINA@GMAIL.COM 
+281,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,23-Sep-20,TAMARA_CARRILLO,F,10-Jun-23,CAÑADON_DE_LOS_INDIOS,KYOUNG@HOTMAIL.COM +282,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,23-Sep-20,LISA_MALONE,F,30-Aug-92,BAJO_DE_LOS_HUESOS,ZBROWN@HOTMAIL.COM +283,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,23-Sep-20,GREGORY_COLLINS,M,31-Jul-95,INGENIO_LA_PROVIDENCIA,HALEYKEVIN@HOTMAIL.COM +284,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,23-Sep-20,TRACY_MILLER,F,15-Oct-24,CAMPO_DEL_NORTE_AMERICANO,CHRISTINEMCCOY@YAHOO.COM +285,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,23-Sep-20,JANET_GOMEZ_DDS,F,04-Sep-51,AMERICA_UNIDA,CHERYL42@YAHOO.COM +286,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,23-Sep-20,KAREN_MOORE,F,07-Oct-07,ARATA,ZSMITH@HOTMAIL.COM +287,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,23-Sep-20,MARTIN_COBB,M,22-Aug-57,LA_PUNTA,REBECCAGORDON@HOTMAIL.COM +288,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,23-Sep-20,WILLIAM_FOWLER,M,05-Mar-09,CARAGUATAY,GEORGEMILES@HOTMAIL.COM +289,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,23-Sep-20,MICHAEL_ORTEGA,M,16-Jun-32,CARAPACHAY,WRIGHTLISA@HOTMAIL.COM +290,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,23-Sep-20,RODNEY_WILKERSON,M,21-Sep-31,CABURE,JOHNCANNON@GMAIL.COM +291,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,24-Sep-20,TARA_MCGEE,F,20-Jul-13,EL_REMANSO,GGARCIA@YAHOO.COM +292,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,24-Sep-20,KEVIN_AUSTIN,M,27-Feb-21,ALBARDON,EVAN49@GMAIL.COM +293,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,24-Sep-20,DEANNA_SANCHEZ,F,16-Oct-19,COLONIA_MONTE_LA_PLATA,QMARTINEZ@GMAIL.COM +294,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,24-Sep-20,JEFFREY_MILLER,M,11-Feb-32,PAZOS_KANKI,RACHEL07@YAHOO.COM 
+295,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,24-Sep-20,GINA_THOMAS,F,29-Jun-65,CIUDAD_MADERO,ROGERSMATTHEW@GMAIL.COM +296,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,24-Sep-20,BRENT_WEEKS,M,16-Nov-75,LA_TRANCA,DEBBIEAYALA@YAHOO.COM +297,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,24-Sep-20,RICKEY_GRIFFITH,M,14-Nov-86,ANECON_CHICO,KMAY@YAHOO.COM +298,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,24-Sep-20,ANDREA_REID,F,26-Jan-76,JOSE_FERRARI,JOHNRICHARDS@GMAIL.COM +299,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,24-Sep-20,KARL_KELLY,M,03-Apr-98,VALENTIN_ALSINA,GARYMOORE@GMAIL.COM +300,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,24-Sep-20,VICKIE_WILLIAMS,F,11-Jul-17,CORONEL_GRANADA,MEGANFERGUSON@GMAIL.COM +301,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,24-Sep-20,KIMBERLY_DAVILA,F,13-Feb-55,CAPITAN_SOLARI,WILLIAMSKARA@HOTMAIL.COM +302,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,24-Sep-20,KEVIN_BURTON,M,02-Nov-24,CAMPO_COLIQUEO,OWOLFE@HOTMAIL.COM +303,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,24-Sep-20,JAMES_BURNS,M,18-Jan-53,ARMINDA,WALVARADO@YAHOO.COM +304,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,24-Sep-20,GRACE_VELASQUEZ,F,24-Nov-83,AGUARA_CUA,GALLEGOSJIM@YAHOO.COM +305,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,24-Sep-20,FRANCIS_GLOVER,M,02-Apr-40,CASIMIRO_GOMEZ,MOORESTEVEN@YAHOO.COM +306,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,24-Sep-20,CHRISTINE_REED,F,20-Jul-00,ALABAMA,NANCY29@YAHOO.COM +307,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,24-Sep-20,ROBERT_WEAVER,M,13-Jun-65,ALEGRIA,RILEYKAREN@HOTMAIL.COM +308,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,24-Sep-20,RYAN_LANDRY,M,19-May-21,VILLA_RUIZ,QPERKINS@HOTMAIL.COM +309,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,24-Sep-20,LEE_REED,M,02-Jul-58,BASE_AERONAVAL_PUNTA_INDIO,FRANK33@GMAIL.COM 
+310,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,25-Sep-20,WILLIAM_FRY,M,06-Nov-10,ARROYO_HONDO,REBECCA24@HOTMAIL.COM +311,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,25-Sep-20,TRACY_CAREY,F,06-Jan-06,CARMEN_DE_ARECO,ROMANLEE@GMAIL.COM +312,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,25-Sep-20,TIFFANY_STEVENS,F,25-Sep-50,EL_CARRETERO,URUSSELL@GMAIL.COM +313,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,25-Sep-20,REBECCA_JOHNSON,F,11-Apr-20,CAMPO_DE_LOS_TOROS,MARSHALLANTHONY@HOTMAIL.COM +314,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,25-Sep-20,JASMINE_JOHNSTON,F,16-Nov-61,ANTONIO_PINI,JENNIFER65@YAHOO.COM +315,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,25-Sep-20,JENNIFER_HUDSON,F,18-Apr-04,CALCHAQUI,ANDRE87@YAHOO.COM +316,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,25-Sep-20,IAN_GOODMAN,M,20-Mar-48,CAPILLA_DEL_SEÑOR,JESSICA98@YAHOO.COM +317,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,25-Sep-20,JOYCE_CAMPBELL,F,16-Jun-90,COLONIA_MORGAN,DIANEDOMINGUEZ@GMAIL.COM +318,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,25-Sep-20,CRAIG_MORGAN,M,11-Oct-13,JOSE_LEON_SUAREZ,JACQUELINE43@GMAIL.COM +319,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,25-Sep-20,KAREN_HAMILTON,F,26-Apr-04,LA_AGUADA_DE_LAS_ANIMAS,TIMOTHYBERRY@YAHOO.COM +320,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,25-Sep-20,JAMES_BRADLEY,M,29-Jan-16,VILLARS,MATTHEW74@YAHOO.COM +321,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Sep-20,JAMES_ROY,M,28-Dec-52,CLAUDIO_C_MOLINA,JACOBSMITH@GMAIL.COM +322,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,26-Sep-20,DANIEL_MULLINS,M,08-Jan-34,CHOLILA,TROYCHARLES@HOTMAIL.COM +323,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,26-Sep-20,KELSEY_BROWN,F,08-Feb-60,LOMAS_DEL_RIO_LUJAN,AVILAJOSEPH@GMAIL.COM +324,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,26-Sep-20,CHARLES_ALVARADO,M,23-Jul-35,SAN_FRANCISCO_SOLANO,QPARSONS@GMAIL.COM 
+325,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,26-Sep-20,JESSICA_JOHNS,F,17-Feb-24,CAMPO_DE_LOS_TOROS,KMULLINS@HOTMAIL.COM +326,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,26-Sep-20,CAROL_MORTON,F,23-May-99,AGUILARES,LAWSONLESLIE@HOTMAIL.COM +327,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,26-Sep-20,TERESA_ROWLAND,F,21-Oct-13,FRANCISCO_CASAL,RMORGAN@HOTMAIL.COM +328,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,26-Sep-20,RACHEL_JACKSON,F,30-Mar-93,COLONIA_HANSEN,SARAGARDNER@HOTMAIL.COM +329,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,26-Sep-20,JOSHUA_RICHARDS,M,25-May-52,ARROYO_SALADO,OSHERMAN@GMAIL.COM +330,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,26-Sep-20,HOLLY_SANCHEZ,F,17-Jul-37,AMILGANCHO,PATRICK50@YAHOO.COM +331,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,26-Sep-20,VICTORIA_CRAWFORD,F,13-Nov-17,CAMPO_RAFFO,ANGELA58@YAHOO.COM +332,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,26-Sep-20,HEATHER_RICHARDSON,F,08-Jan-08,CAÑADON_LEON,PAMELAMAYER@GMAIL.COM +333,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,27-Sep-20,JESUS_ROWE,M,03-Jul-74,LA_PELADA,MCOOPER@HOTMAIL.COM +334,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,27-Sep-20,CHRISTIAN_ROSS,M,03-Apr-78,RAFAEL_CALZADA,TRACIE62@YAHOO.COM +335,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,27-Sep-20,JOSEPH_BALDWIN,M,04-Feb-74,VALLE_HONDO,HARRINGTONJORDAN@HOTMAIL.COM +336,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,27-Sep-20,CYNTHIA_LEE,F,08-Dec-79,BARRIO_VILLA_SALADILLO,CASTROJAMIE@YAHOO.COM +337,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,27-Sep-20,DAVID_GARCIA,M,19-Jan-28,CARANDAITI,LISAROACH@HOTMAIL.COM +338,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,27-Sep-20,STEPHEN_WOODARD,M,28-Jan-10,DOCTOR_DOMINGO_HAROSTEGUY,FLORESCHRISTOPHER@HOTMAIL.COM 
+339,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,27-Sep-20,CHRISTINA_BOONE,F,27-Jul-21,AEROPUERTO_EZEIZA,BETTYMCKAY@HOTMAIL.COM +340,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,27-Sep-20,CHRISTOPHER_MADDEN,M,18-Jun-55,PUENTE_DEL_INCA,NICHOLASMONTGOMERY@YAHOO.COM +341,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,27-Sep-20,BOBBY_LOPEZ,M,10-Apr-96,BARRIO_1_DE_MAYO,ANDERSONSTEPHANIE@HOTMAIL.COM +342,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,27-Sep-20,JENNIFER_SHARP,F,10-May-28,25_DE_MAYO,ONEALNICOLE@GMAIL.COM +343,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,27-Sep-20,MELISSA_WARD,F,01-Feb-35,COLONIA_RIVAS,WHITAKERKATHERINE@HOTMAIL.COM +344,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,27-Sep-20,HALEY_WILLIAMS,F,02-May-93,AMBROSIO_P_LEZICA,MCGUIREKAREN@GMAIL.COM +345,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,28-Sep-20,COURTNEY_BAILEY,F,20-Mar-08,ABRA_RICA,JOSEPH58@HOTMAIL.COM +346,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,28-Sep-20,JOHN_HARRIS,M,21-Nov-28,BELLOCQ,BRYANCARMEN@GMAIL.COM +347,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,28-Sep-20,BRIAN_ROJAS,M,24-Dec-71,LA_CHIRLANDIA,SHARONMCCARTY@YAHOO.COM +348,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,28-Sep-20,JONATHAN_OCHOA,M,31-Aug-98,LA_SALADA,CHRISTYMOODY@HOTMAIL.COM +349,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,28-Sep-20,CLAIRE_LUCAS,F,19-Jul-14,AGUA_DE_DIONISIO,WOODSLISA@HOTMAIL.COM +350,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,28-Sep-20,WILLIAM_CUNNINGHAM,M,06-Aug-91,AGUADA_DE_GUERRA,NICOLE75@GMAIL.COM +351,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,28-Sep-20,DANIEL_REID,M,09-Jan-57,LIERRA_ADJEMIRO,YGONZALEZ@YAHOO.COM +352,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,28-Sep-20,DANIEL_EVANS,M,25-Sep-65,CROTTO,MAXWELLTERESA@HOTMAIL.COM +353,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,28-Sep-20,TAMMY_KING,F,25-Feb-12,LA_PORTEÑA,CARRILLOMARY@YAHOO.COM 
+354,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,28-Sep-20,ANDREW_SULLIVAN,M,17-Jul-80,ARBOL_VERDE,KIMBERLYSCHNEIDER@HOTMAIL.COM +355,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,28-Sep-20,ERIC_HERNANDEZ,M,26-Jul-18,CAVOUR,CHICKMAN@GMAIL.COM +356,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,28-Sep-20,STEPHANIE_RICHARDSON,F,20-Dec-82,17_DE_AGOSTO,JULIALOPEZ@YAHOO.COM +357,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,28-Sep-20,CHRISTINE_RUBIO,F,25-Jun-75,ARROYO_HONDO,JASONROBINSON@GMAIL.COM +358,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,29-Sep-20,MATTHEW_BOLTON,M,26-Oct-97,ALLEN,THOMASOBRIEN@YAHOO.COM +359,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,29-Sep-20,DAISY_TYLER,F,13-Mar-70,CABAÑA_EL_CISNE,RODNEY66@GMAIL.COM +360,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,29-Sep-20,MICHELLE_WADE,F,31-Mar-09,ALASTUEY,KLEWIS@GMAIL.COM +361,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,29-Sep-20,MICHAEL_DOMINGUEZ,M,06-Jul-09,ACHALCO,DONNAPEREZ@GMAIL.COM +362,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,29-Sep-20,TRACI_JUAREZ,F,03-Feb-70,ABRALAITE,GRIMESCYNTHIA@GMAIL.COM +363,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,29-Sep-20,BRITTNEY_SPARKS,F,24-Feb-62,AGUA_DE_CASTILLA,ERICABOWERS@GMAIL.COM +364,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,29-Sep-20,VALERIE_MAYNARD,F,02-Aug-41,FRIGORIFICO_CAP,FOWLERERIK@YAHOO.COM +365,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,29-Sep-20,BRITTNEY_COLE,F,10-Aug-34,COMANDANTE_GIRIBONE,JAMESMAYER@YAHOO.COM +366,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,29-Sep-20,MONICA_FARLEY,F,02-Oct-72,CAÑADA_RICA,MARIA48@YAHOO.COM +367,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,29-Sep-20,JOHN_FLORES,M,05-Dec-16,AGUADA_CHACAY_CO,CHURCHMIGUEL@GMAIL.COM 
+368,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,29-Sep-20,KEVIN_BOYLE,M,19-Jan-24,HITO_45,NBRADFORD@HOTMAIL.COM +369,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,29-Sep-20,CARL_WASHINGTON,M,04-Jul-48,6_DE_SEPTIEMBRE,FOXMICHAEL@GMAIL.COM +370,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,29-Sep-20,TODD_FRAZIER,M,12-Jun-30,ALBERTO_FLORES,AMYNEAL@GMAIL.COM +371,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,29-Sep-20,TRACY_MONTGOMERY,F,25-Jul-29,ESTANCIAS,KEITHHERNANDEZ@GMAIL.COM +372,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,29-Sep-20,LORI_ANDERSON,F,11-May-20,ALVARO_BARROS,RACHELREYNOLDS@HOTMAIL.COM +373,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,30-Sep-20,JENNIFER_ZUNIGA,F,02-Sep-85,BARRANQUITAS,VINCENTLAURA@GMAIL.COM +374,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,30-Sep-20,JESSICA_WILSON,F,31-Jan-48,CORONEL_GRANADA,GPAGE@YAHOO.COM +375,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,30-Sep-20,RONNIE_SANDERS,M,20-Oct-15,EL_TRIGO,KARAYATES@YAHOO.COM +376,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,30-Sep-20,YVONNE_JOHNSON,F,05-Sep-32,BENITO_JUAREZ,MCDONALDAARON@GMAIL.COM +377,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,30-Sep-20,HANNAH_HALL,F,30-Dec-48,AGUADA,HEATHER32@GMAIL.COM +378,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,30-Sep-20,JENNIFER_RAY,F,28-Sep-16,COLONIA_ALBERDI,DAVID54@YAHOO.COM +379,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,30-Sep-20,MEGHAN_SMITH,F,27-Dec-80,CAMPO_LA_RIVIERE,RTAYLOR@YAHOO.COM +380,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,30-Sep-20,DALE_PATEL,M,22-Nov-08,4_DE_NOVIEMBRE,EDUKE@HOTMAIL.COM +381,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,30-Sep-20,DANIEL_COHEN,M,13-Nov-83,LEHMANN,FRANKSMITH@HOTMAIL.COM +382,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,01-Oct-20,RYAN_CARLSON,M,03-Jul-69,HARAS_SAN_JACINTO,JROMERO@GMAIL.COM 
+383,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,01-Oct-20,GRANT_RUIZ,M,25-Jan-26,CAÑADON_SECO,WEAVERBARBARA@GMAIL.COM +384,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,01-Oct-20,ERICA_NELSON,F,03-Feb-42,ALPACHIRI,ANTHONY24@YAHOO.COM +385,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,01-Oct-20,KAREN_GAMBLE,F,26-Oct-20,CAMPO_PESOA,STEPHANIEBERRY@YAHOO.COM +386,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,01-Oct-20,CHRISTOPHER_RUSSELL,M,04-Apr-46,BELLOCQ,PATTERSONJEREMY@GMAIL.COM +387,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,01-Oct-20,ANTHONY_KENNEDY,M,16-Feb-04,JESUS_MARIA,ALEXANDRA42@GMAIL.COM +388,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,01-Oct-20,JEFFREY_SMITH,M,18-Oct-32,ANGEL_GALLARDO,ZTAYLOR@GMAIL.COM +389,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Oct-20,LAURA_RIDDLE,F,22-May-32,ESTEBAN_DE_LUCA,JOSHUARIVERA@HOTMAIL.COM +390,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,01-Oct-20,MADELINE_CARSON,F,22-Jul-31,BOCAYUBA,CHRISTOPHER85@YAHOO.COM +391,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,01-Oct-20,ANNA_LOWE,F,20-Jun-04,AGUAS_DE_LAS_MULAS,OHUNT@YAHOO.COM +392,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,01-Oct-20,ANGELA_NGUYEN,F,13-Jun-06,ARROYO_SALADO,MEGAN93@GMAIL.COM +393,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,01-Oct-20,JOSHUA_SPEARS,M,03-May-64,ENCINA,PSANDERS@HOTMAIL.COM +394,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,01-Oct-20,REGINA_BRIGGS,F,18-Jun-66,ARROYO_PESCADO,KATELYN31@GMAIL.COM +395,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,01-Oct-20,DAVID_BROWN,M,10-Dec-94,BLANDENGUES,CARTERKEITH@HOTMAIL.COM +396,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,01-Oct-20,JESSICA_SANTIAGO,F,26-Oct-26,ALPACHIRI,DAWN33@YAHOO.COM +397,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,02-Oct-20,MELISSA_ROSS,F,20-Feb-62,10_DE_MAYO,WILLIAM11@GMAIL.COM 
+398,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,02-Oct-20,HEATHER_WILLIAMS,F,22-Jun-92,ALTO_LAS_LECHUZAS,CHERYLCHAN@GMAIL.COM +399,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,02-Oct-20,KEVIN_HARMON,M,24-Aug-18,LA_FLORENCIA,BISHOPPATRICK@HOTMAIL.COM +400,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,02-Oct-20,CHRISTINA_GUTIERREZ,F,23-Dec-65,BUSTAMANTE,SMITHMELANIE@HOTMAIL.COM +401,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,02-Oct-20,GARY_HAYS,M,16-Apr-07,AGUAYO,DANIELMENDOZA@HOTMAIL.COM +402,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,02-Oct-20,KRISTI_CHERRY,F,03-Jul-62,WILDE,ZRIVERA@GMAIL.COM +403,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,02-Oct-20,STEPHANIE_MARTIN,F,05-Dec-34,CERES,NSANCHEZ@YAHOO.COM +404,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,02-Oct-20,ANDREW_MULLINS,M,11-Aug-01,CAMPO_HUBER,MILLERLUIS@YAHOO.COM +405,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,02-Oct-20,CRAIG_AUSTIN,M,19-Mar-62,ALDEA_APELEG,HERNANDEZREBECCA@HOTMAIL.COM +406,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,02-Oct-20,JUSTIN_HOWELL,M,09-May-40,ALANICES,CRYSTALTAYLOR@GMAIL.COM +407,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,02-Oct-20,HEATHER_MILLER_MD,F,22-Jun-39,COLONIA_JAPONESA,COURTNEYGONZALEZ@GMAIL.COM +408,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,02-Oct-20,DUSTIN_WILSON,M,18-Jun-20,WILDE,KFRYE@HOTMAIL.COM +409,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,02-Oct-20,WESLEY_HORNE,M,04-Apr-35,BOCAS,XARCHER@YAHOO.COM +410,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,02-Oct-20,MATTHEW_MOODY,M,02-Jan-33,COLONIA_HANSEN,GONZALEZKELSEY@HOTMAIL.COM +411,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,03-Oct-20,KATIE_SAUNDERS,F,14-Jan-65,LAS_PALMAS,OFREEMAN@YAHOO.COM +412,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,03-Oct-20,NICOLE_STEWART_DVM,F,19-Aug-25,ALTO_JAGUEL,COLLINSPAUL@GMAIL.COM 
+413,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,03-Oct-20,TIMOTHY_TOWNSEND,M,24-Nov-78,CARLOS_PELLEGRINI,JOHN38@GMAIL.COM +414,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,03-Oct-20,BRIAN_REYNOLDS,M,27-Jan-23,BARRIO_EL_TONTAL,MATTHEWADAMS@HOTMAIL.COM +415,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,03-Oct-20,MARIE_MASON,F,06-Oct-34,ATREUCO,DANIELFLOWERS@YAHOO.COM +416,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,03-Oct-20,RYAN_REYES,M,23-Oct-40,7_DE_ABRIL,ANDRADEAPRIL@GMAIL.COM +417,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,03-Oct-20,SARAH_ROACH,F,22-Nov-17,EL_HOYO,HAROLDADAMS@YAHOO.COM +418,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,03-Oct-20,JOSEPH_CLARK,M,10-Jul-36,FARO_SAN_ANTONIO,MOOREMARK@YAHOO.COM +419,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,03-Oct-20,KEVIN_CARPENTER,M,25-Feb-36,AGUA_DE_CASTILLA,LOPEZCATHERINE@GMAIL.COM +420,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,04-Oct-20,REBECCA_BERRY,F,28-Sep-56,ARTURO_SEGUI,BHAMILTON@GMAIL.COM +421,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,04-Oct-20,BENJAMIN_PETERSEN,M,19-May-05,AGUA_COLORADA,JEFFREYYOUNG@YAHOO.COM +422,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,04-Oct-20,JEAN_KELLY,F,03-Oct-59,VILLA_MANZANO,QLEWIS@YAHOO.COM +423,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,04-Oct-20,STEVEN_MARTIN,M,17-Jun-16,ANGOSTURA,BENJAMINANDERSON@YAHOO.COM +424,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,04-Oct-20,ALLISON_RILEY,F,30-Apr-74,VILLA_ANGELICA,AMY77@GMAIL.COM +425,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,04-Oct-20,ANTHONY_KING,M,12-Jan-40,JOSE_FERRARI,JSHELTON@YAHOO.COM +426,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,04-Oct-20,JOSEPH_KENT,M,22-Sep-40,PEYRANO,BRANDONMCCORMICK@HOTMAIL.COM +427,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,04-Oct-20,NATASHA_MATTHEWS,F,07-Jul-62,EREZCANO,CHANGSTEPHANIE@GMAIL.COM 
+428,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,04-Oct-20,JOSHUA_PEREZ,M,23-Jul-19,COOPER,TCHRISTIAN@GMAIL.COM +429,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,04-Oct-20,TONY_JOHNSON,M,28-Nov-23,HARAS_SAN_JACINTO,GARCIAVINCENT@YAHOO.COM +430,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,04-Oct-20,ROBIN_GRANT,F,09-Jun-22,ARROYO_QUILLA,CHARLESEDWARDS@HOTMAIL.COM +431,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,04-Oct-20,ROBERT_HERNANDEZ,M,04-Mar-04,ALTO_CON_ZAMPA,WRIGHTLEONARD@HOTMAIL.COM +432,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,04-Oct-20,JOHN_GRAY,M,16-Sep-19,VILLA_ROSA,BOONEPRESTON@GMAIL.COM +433,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,05-Oct-20,ASHLEY_BROWN,F,08-Jan-84,COLONIA_HANSEN,ROBERTSROBERT@YAHOO.COM +434,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,05-Oct-20,PAMELA_PHILLIPS,F,18-Jul-16,BANDA_VARELA,MPOPE@GMAIL.COM +435,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,05-Oct-20,JONATHAN_OROZCO,M,02-Jul-15,ALGARROBAL_PUISOYE,NICOLE35@HOTMAIL.COM +436,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,05-Oct-20,SEAN_DAVIS,M,15-Feb-07,ALPACHIRI,JELLIOTT@YAHOO.COM +437,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,05-Oct-20,JOSE_HICKS,M,10-Nov-24,ALVARO_BARROS,ANDERSONANDREW@YAHOO.COM +438,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,05-Oct-20,TOM_ROSE_MD,M,24-Jun-45,AMERICA,ELIZABETHWOODS@HOTMAIL.COM +439,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,05-Oct-20,LISA_GONZALEZ,F,22-Oct-47,ANGACO_NORTE,MILLERJONATHON@GMAIL.COM +440,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,05-Oct-20,ROBERTO_BLACK,M,18-Feb-33,ATALAYA,DJACKSON@HOTMAIL.COM +441,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,05-Oct-20,SHANNON_JONES,F,02-Jun-79,BARADERO,JOHNSONANTHONY@YAHOO.COM 
+442,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,05-Oct-20,MICHAEL_GONZALEZ,M,24-Oct-56,COLONIA_EGIDO,ATKINSONCHARLES@HOTMAIL.COM +443,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,05-Oct-20,VICTOR_WHITE,M,18-Oct-93,CHIMPAY,CAMPBELLASHLEY@YAHOO.COM +444,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,05-Oct-20,PATRICK_JACKSON,M,25-Feb-25,AERO_CLUB_ROSARIO,DEANNA37@YAHOO.COM +445,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,05-Oct-20,JOSEPH_MCGUIRE,M,04-Jan-43,COLONIA_HINOJO,DAWN77@YAHOO.COM +446,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,06-Oct-20,EMMA_BALL,F,13-May-21,TRISTAN_SUAREZ,ZBUCKLEY@HOTMAIL.COM +447,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,06-Oct-20,COURTNEY_KIRK,F,06-Jul-68,CAMPO_MEDINA,MBREWER@GMAIL.COM +448,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,06-Oct-20,AMY_WALLACE,F,31-Mar-12,CATARATAS_DEL_IGUAZU,DAVIDHESS@HOTMAIL.COM +449,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,06-Oct-20,NOAH_HARRIS,M,18-Nov-98,ARROYO_PALMAR,OSUMMERS@GMAIL.COM +450,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,06-Oct-20,BRENDA_WALKER,F,24-Nov-07,BERDUC,SHEPHERDCARL@GMAIL.COM +451,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,06-Oct-20,CHAD_BOOKER,M,07-Jul-37,BUENA_VISTA,JENNIFERSANCHEZ@GMAIL.COM +452,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,07-Oct-20,DEBBIE_HOLDEN,F,22-Jan-22,ALTO_LINDO,TURNERPAMELA@GMAIL.COM +453,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,07-Oct-20,SHERRY_GONZALEZ,F,29-Jul-29,9_DE_JULIO,AFLEMING@HOTMAIL.COM +454,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,07-Oct-20,DR._MARY_PEREZ,F,28-Aug-04,AGUA_DE_LAS_PALOMAS,VIRGINIAROBERTS@HOTMAIL.COM +455,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,07-Oct-20,KYLIE_REYES,F,06-Jan-03,AGUADA_GUZMAN,CHRISTOPHERRIVERA@GMAIL.COM +456,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,07-Oct-20,JESSE_RODRIGUEZ,M,18-May-54,LA_MOROCHA,URANGEL@HOTMAIL.COM 
+457,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,07-Oct-20,SUSAN_FULLER,F,29-Jan-69,CHIVILCOY,REGINA66@YAHOO.COM +458,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,07-Oct-20,ANTHONY_GARNER,M,25-Feb-53,SAN_MAYOL,JOSEPHDAVIS@HOTMAIL.COM +459,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,07-Oct-20,HECTOR_GARZA,M,11-Feb-34,SAN_FERNANDO,TRACYMORALES@YAHOO.COM +460,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,07-Oct-20,ANDREW_BELTRAN,M,15-Oct-17,COLONIA_ESPAÑA,BARBARAORTIZ@HOTMAIL.COM +461,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,07-Oct-20,JOHN_ROMERO,M,26-Jul-21,LA_UNION,SBARBER@YAHOO.COM +462,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,07-Oct-20,ANGELICA_HOFFMAN,F,29-Apr-13,PUERTO_OJO_DE_AGUA,MBOYD@HOTMAIL.COM +463,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,07-Oct-20,MAUREEN_LONG,F,18-Aug-22,ABALO,NATHANIEL42@HOTMAIL.COM +464,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,08-Oct-20,SHERI_QUINN,F,27-Apr-84,SAN_MAYOL,DEREK21@GMAIL.COM +465,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,08-Oct-20,MATTHEW_COLE,M,19-Aug-49,ARROYO_DEL_REY,THOMASCYNTHIA@YAHOO.COM +466,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,08-Oct-20,PAMELA_MANN,F,25-Dec-72,ALDEA_FORESTAL,CAMPOSAMBER@YAHOO.COM +467,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,08-Oct-20,STEVEN_HARDY,M,01-Dec-18,CORONEL_BOERR,DARRELLJIMENEZ@YAHOO.COM +468,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,08-Oct-20,DWAYNE_DENNIS,M,10-Aug-11,ARROYO_MOLINO,ROBERTSONMORGAN@HOTMAIL.COM +469,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,08-Oct-20,BRIAN_FOLEY,M,02-Jul-89,ALBERTO_GERCHUNOFF,TRACI74@GMAIL.COM +470,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,08-Oct-20,SHAWN_RICHARDSON,M,04-Jul-02,CHOCORI,RAMIREZGINA@YAHOO.COM +471,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,08-Oct-20,MR._CURTIS_NGUYEN,M,04-Jan-36,BELLA_ITALIA,JACKSONCRYSTAL@HOTMAIL.COM 
+472,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,08-Oct-20,SUSAN_LEBLANC,F,26-Apr-18,ALBARRACIN,MMORALES@YAHOO.COM +473,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,08-Oct-20,JAMES_MARTIN,M,20-Oct-83,PUNTA_LARA,JANICE49@GMAIL.COM +474,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,08-Oct-20,TAYLOR_MCMAHON,F,03-Feb-10,SAN_JOSE,JONESJENNA@HOTMAIL.COM +475,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,09-Oct-20,JACOB_HICKMAN,M,31-Jan-07,ABBOTT,ANDERSONMELISSA@GMAIL.COM +476,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,09-Oct-20,JACOB_THOMAS,M,15-Sep-47,AGUA_COLORADA,PAUL06@GMAIL.COM +477,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,09-Oct-20,JESSICA_JONES,F,04-Jun-06,ARROYO_URQUIZA,MCBRIDEJOHN@GMAIL.COM +478,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,09-Oct-20,JENNIFER_BECK_DVM,F,20-May-55,SANTA_TERESITA,HATFIELDJOHNATHAN@GMAIL.COM +479,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,09-Oct-20,LISA_FOSTER,F,24-Jan-49,25_DE_MAYO,IPOTTER@HOTMAIL.COM +480,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,10-Oct-20,DAVID_MASON,M,12-May-38,BEALISTOCK,GABRIELLE52@GMAIL.COM +481,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,10-Oct-20,TYLER_KERR,M,19-May-63,HUANQUEROS,COLEMELISSA@GMAIL.COM +482,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,10-Oct-20,WILLIAM_ROGERS,M,10-Jan-17,CATARATAS_DEL_IGUAZU,BLAKE61@YAHOO.COM +483,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,10-Oct-20,BRANDON_JONES,M,18-Feb-85,JUAN_VUCETICH_EX_DR_R_LEVENE,ISMITH@HOTMAIL.COM +484,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,10-Oct-20,JUSTIN_GARDNER,M,19-May-99,KILOMETRO_374,ABROWN@GMAIL.COM +485,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,10-Oct-20,STEVEN_SCOTT,M,12-Jul-13,BANDA_FLORIDA,YOUNGSHELBY@YAHOO.COM +486,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,10-Oct-20,THOMAS_WILSON,M,10-Sep-41,16_DE_JULIO,JODYSMITH@HOTMAIL.COM 
+487,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,10-Oct-20,AMBER_SMITH,F,24-Apr-15,AGUSTONI,STEELEJOHN@HOTMAIL.COM +488,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,10-Oct-20,MARC_MORROW,M,14-Mar-86,LOMAS_DE_ZAMORA,KARINA37@YAHOO.COM +489,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,10-Oct-20,CARL_BALDWIN,M,26-Mar-88,CAMPAMENTO_SOL,ROBERTVALDEZ@GMAIL.COM +490,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,10-Oct-20,DENNIS_SIMPSON,M,26-Apr-00,COLONIA_MONTE_LA_PLATA,INGRAMDONALD@GMAIL.COM +491,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,10-Oct-20,ROBIN_ROWLAND,F,14-Sep-10,ALTAMIRANO_NORTE,ASHLEYBROWN@HOTMAIL.COM +492,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,11-Oct-20,RICHARD_JONES,M,19-Sep-64,FIRMAT,TERESA84@YAHOO.COM +493,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,11-Oct-20,ANTHONY_WATKINS,M,22-Feb-17,LOS_CORREDORES,DMURRAY@HOTMAIL.COM +494,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,11-Oct-20,DANIEL_HERNANDEZ,M,03-Jul-73,CHAVARRIA,JIMCHAVEZ@HOTMAIL.COM +495,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,11-Oct-20,DAWN_SAUNDERS,F,12-Mar-54,ANILLACO,CHRISTOPHER56@HOTMAIL.COM +496,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,11-Oct-20,MICHAEL_SPENCER,M,01-Apr-28,CAMINERA_SAMBOROMBON,JACK76@GMAIL.COM +497,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,11-Oct-20,MICHAEL_LAMB,M,06-Oct-34,KILOMETRO_77,RACHEL86@HOTMAIL.COM +498,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,11-Oct-20,PAUL_THOMAS,M,18-Oct-57,BENITO_JUAREZ,NDELEON@HOTMAIL.COM +499,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,11-Oct-20,TARA_COLLINS,F,17-Nov-69,BURZACO,OFLORES@YAHOO.COM +500,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,11-Oct-20,BRIAN_HOWARD,M,27-Jul-41,BONPLAND,SUE21@HOTMAIL.COM +501,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,11-Oct-20,ANDREW_SULLIVAN,M,02-Oct-46,FRANCISCO_ALVAREZ,OMARVASQUEZ@YAHOO.COM 
+502,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,11-Oct-20,HAYDEN_JENNINGS,M,09-May-63,COLONIA_LA_NEGRA,JULIAJOHNSON@GMAIL.COM +503,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,11-Oct-20,STEVEN_KEITH,M,18-Dec-47,ISLA_LOS_LAURELES,PATRICIA80@YAHOO.COM +504,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,11-Oct-20,JULIA_WEBB,F,20-Jul-65,EL_ESPINILLO,DLEE@HOTMAIL.COM +505,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,11-Oct-20,JEFFREY_HOUSTON,M,29-Aug-71,ESTACION_YERUA,DEBORAH60@GMAIL.COM +506,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,11-Oct-20,JAMES_DOUGHERTY,M,22-May-54,BUENA_NUEVA,DENNISCONWAY@YAHOO.COM +507,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,11-Oct-20,ZACHARY_BROWN,M,25-Sep-61,ALFEREZ_SAN_MARTIN,TRAVISHOUSTON@YAHOO.COM +508,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,11-Oct-20,KIMBERLY_DIAZ,F,12-Dec-06,CAÑADON_CHILENO,DAVID99@GMAIL.COM +509,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,12-Oct-20,BONNIE_MATHEWS,F,01-Jul-77,ALFREDO_PEÑA,CURTISPARKER@YAHOO.COM +510,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,12-Oct-20,RACHAEL_RICHARDSON,F,19-Apr-84,CARACOLES,WALKERJAMES@YAHOO.COM +511,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,12-Oct-20,RICKY_REESE,M,20-Jan-22,BARRIO_FERRI,HASHLEY@GMAIL.COM +512,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,12-Oct-20,ANN_ALVAREZ,F,26-Mar-22,COMANDANTE_NICANOR_OTAMENDI,KHANLISA@GMAIL.COM +513,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,12-Oct-20,RICKY_DELGADO,M,28-Apr-94,VIRREY_DEL_PINO,JUSTINCHAVEZ@YAHOO.COM +514,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,12-Oct-20,JASON_MEYER,M,11-Jun-44,CLAYPOLE,CLEWIS@HOTMAIL.COM +515,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,12-Oct-20,TIMOTHY_JOHNSTON,M,15-Jun-29,BME_BAVIO_GRAL_MANSILLA,RYAN49@GMAIL.COM +516,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,12-Oct-20,KATHERINE_BOND,F,18-Jun-38,AGOTE,IANDRADE@GMAIL.COM 
+517,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,12-Oct-20,HOWARD_ANDRADE,M,29-Aug-83,ARROYO_DE_LA_CRUZ,MARKHILL@GMAIL.COM +518,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,12-Oct-20,TIFFANY_ELLIS,F,07-Jun-34,ARRASCAETA,ROGERSLISA@HOTMAIL.COM +519,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,12-Oct-20,RICKY_KING,M,26-Aug-14,AGUADA_CHACAY_CO,PAYNESARAH@GMAIL.COM +520,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,12-Oct-20,SEAN_MILLER,M,07-Mar-07,FUNKE,RUSSELLBRYAN@HOTMAIL.COM +521,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,12-Oct-20,KIMBERLY_BROWN,F,29-Sep-26,CAÑADA,XHAHN@HOTMAIL.COM +522,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,12-Oct-20,MICHAEL_THOMPSON,M,21-Oct-18,COLONIA_CUNCI,QJOHNSON@HOTMAIL.COM +523,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,12-Oct-20,KENNETH_LYNN,M,26-Apr-04,AGUA_COLORADA,THERESAMUNOZ@GMAIL.COM +524,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,12-Oct-20,BRIAN_BUCKLEY,M,12-Jun-72,CAMPO_QUIRNO,BROWNINGCHRISTOPHER@GMAIL.COM +525,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,12-Oct-20,TIMOTHY_GRAVES,M,07-Jan-16,CAMPO_DE_TALAMAYO,TERRI10@YAHOO.COM +526,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,13-Oct-20,LOGAN_THOMAS,M,01-Oct-62,CAAGUAZU,PCLARK@YAHOO.COM +527,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,13-Oct-20,BRIAN_CHARLES,M,06-Aug-17,ALIZAL,VTHOMAS@GMAIL.COM +528,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,13-Oct-20,KIMBERLY_WIGGINS,F,05-Feb-38,BARROS_PAZOS,ANDREWRANDOLPH@GMAIL.COM +529,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,13-Oct-20,GINA_STEVENS,F,05-Jun-74,COLONIA_TACURALES,JASMINE29@HOTMAIL.COM +530,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,13-Oct-20,EDWIN_ESPARZA,M,17-Aug-20,MAORI,QFARMER@HOTMAIL.COM +531,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,13-Oct-20,WILLIAM_BARAJAS,M,06-Mar-75,BARROS_PAZOS,RANDYONEILL@GMAIL.COM 
+532,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,13-Oct-20,JENNIFER_CLARK,F,08-Feb-86,CAÑADA_DE_LAS_OVEJAS,YJONES@YAHOO.COM +533,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,13-Oct-20,TIFFANY_JENSEN,F,13-Aug-29,VILLA_SAUCE,WSHELTON@HOTMAIL.COM +534,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,13-Oct-20,TIFFANY_MARTINEZ,F,22-Jan-08,BAÑADO_NORTE,CROSS@HOTMAIL.COM +535,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,13-Oct-20,STEVEN_CLEMENTS,M,29-Mar-66,ACOSTILLA,KATHERINEVEGA@YAHOO.COM +536,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,13-Oct-20,RONALD_GOULD,M,05-Feb-34,ARROYO_DULCE,QMANN@YAHOO.COM +537,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,13-Oct-20,VINCENT_HILL,M,29-Jun-29,CATARATAS_DEL_IGUAZU,HANNAHCOLLINS@GMAIL.COM +538,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,13-Oct-20,JAMES_MORENO,M,30-Sep-16,1_DE_MAYO,SANDRAREYNOLDS@YAHOO.COM +539,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,13-Oct-20,KARA_WHITE,F,14-Jul-06,ATAHUALPA,TPOWERS@GMAIL.COM +540,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,13-Oct-20,DANIELLE_WOOD,F,29-Jun-62,ALIZAL,HKELLER@YAHOO.COM +541,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,13-Oct-20,STEPHANIE_PETERS,F,12-Jan-31,BALNEARIO_CHAPALCO,STEPHENRIVERA@YAHOO.COM +542,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,14-Oct-20,LUIS_ALLEN,M,11-Dec-79,COLONIA_EGIDO,YCOHEN@HOTMAIL.COM +543,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,14-Oct-20,KAREN_GRANT,F,19-Jun-21,ANTONIO_TOMAS_SUD,ISAIAHCONTRERAS@YAHOO.COM +544,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,14-Oct-20,JENNY_ZIMMERMAN,F,17-Jul-96,AGUAYO,RWILSON@GMAIL.COM +545,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,14-Oct-20,CHAD_ROCHA,M,14-Nov-17,LOS_FRENTONES,JOHN25@HOTMAIL.COM +546,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,14-Oct-20,JUAN_MILLER,M,21-Jul-35,CAÑADON_CHILENO,ERIC77@YAHOO.COM 
+547,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,14-Oct-20,MARGARET_MOORE,F,26-Feb-71,AVELLANEDA,BROWNCATHERINE@YAHOO.COM +548,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,14-Oct-20,CONNOR_STRICKLAND,M,08-Feb-04,CENTRO_AGRICOLA_EL_PATO,BALDWINALYSSA@YAHOO.COM +549,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,14-Oct-20,GAIL_WALKER,F,20-Sep-12,CRISTOLIA,UCHUNG@GMAIL.COM +550,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,14-Oct-20,CASSANDRA_STEELE,F,12-Dec-23,CAMET,VANDERSON@HOTMAIL.COM +551,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,14-Oct-20,MATTHEW_HARRISON,M,16-Sep-87,DESTILERIA_FISCAL,KIRBYMICHAEL@GMAIL.COM +552,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,14-Oct-20,BRIANNA_MASSEY,F,13-May-09,BARRANQUITAS,KELLY33@HOTMAIL.COM +553,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,14-Oct-20,DAVID_HALL,M,27-Dec-35,COLONIA_LOS_SAUCES,CAMACHOJESSICA@GMAIL.COM +554,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,14-Oct-20,MIGUEL_HESTER,M,03-Feb-19,GANDOLFI,ANTHONYBARBER@HOTMAIL.COM +555,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,14-Oct-20,KIMBERLY_ALEXANDER,F,15-Dec-29,AMBROSIO_P_LEZICA,JWEEKS@HOTMAIL.COM +556,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,14-Oct-20,CHELSEY_DURHAM,F,10-Apr-83,COLONIA_ALBERDI,ROBLESTHOMAS@GMAIL.COM +557,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,14-Oct-20,JANET_MARTIN,F,17-Jul-03,BOUQUET,GSANDERS@HOTMAIL.COM +558,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,14-Oct-20,ANGELA_STOKES,F,07-Oct-18,BARRIO_VILLA_ADELA,BAXTERMICHAEL@HOTMAIL.COM +559,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,14-Oct-20,SHELLEY_COOPER,F,01-Jul-14,ALSINA,JMCGUIRE@HOTMAIL.COM +560,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,14-Oct-20,COREY_JIMENEZ,M,14-Mar-92,BATAVIA,HARRISONANTHONY@YAHOO.COM +561,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,14-Oct-20,TRACY_COLE,M,16-Jul-22,KILOMETRO_184,CALDWELLJENNIFER@YAHOO.COM 
+562,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,14-Oct-20,KAYLEE_SMITH,F,23-Nov-82,COLONIA_RIVAS,SIMSEMILY@GMAIL.COM +563,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,15-Oct-20,PAMELA_GONZALEZ,F,19-Jul-62,BALDE_DE_LEYES,JENNIFER84@GMAIL.COM +564,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,15-Oct-20,CHRISTINE_FLORES,F,28-Oct-12,ISLA_GRAN_MALVINA,HOLLYELLISON@HOTMAIL.COM +565,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,15-Oct-20,NANCY_GARDNER,F,21-Dec-25,CARMEN_DE_ARECO,JASON02@YAHOO.COM +566,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,15-Oct-20,MELINDA_SHELTON,F,19-Sep-11,BALCARCE,BROWNMEGAN@HOTMAIL.COM +567,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,15-Oct-20,JILL_SMITH,F,21-Oct-57,BURZACO,JOHNSIMMONS@YAHOO.COM +568,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,15-Oct-20,MICHAEL_BROWN,M,29-Mar-60,CAMPANA,DENNIS56@GMAIL.COM +569,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,15-Oct-20,MICHAEL_ANDERSON,M,09-Nov-35,DEL_VALLE,LAMBDONNA@YAHOO.COM +570,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,15-Oct-20,VICTORIA_COLE,F,08-Apr-97,3_DE_MAYO,JAMESJOSHUA@HOTMAIL.COM +571,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,15-Oct-20,MR._JOHN_PARKER,M,01-Dec-88,EL_TRIGO,EWEISS@YAHOO.COM +572,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,15-Oct-20,DR._MALIK_HENRY,M,03-Feb-75,ALCARAZ_1RO,FOXCARL@GMAIL.COM +573,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,15-Oct-20,CHAD_BENSON,M,11-Jul-46,COLONIA_CAMPO_PIAGGIO,DANIEL70@HOTMAIL.COM +574,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,15-Oct-20,NANCY_DIAZ,F,06-Jul-45,BOEUF,STANLEY99@GMAIL.COM +575,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,16-Oct-20,NICHOLAS_WOOD,M,14-Jul-43,BAHIA_CRACHER,LUCASDOUGLAS@GMAIL.COM +576,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,16-Oct-20,JESSICA_FLOYD,F,14-Jul-10,COLONIA_BELGA_AMERICANA,VALENCIAJULIE@GMAIL.COM 
+577,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,16-Oct-20,JOSHUA_RAY,M,25-Jul-63,CAMPO_ZAVALLA,MATTHEWMARSHALL@HOTMAIL.COM +578,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,16-Oct-20,CATHERINE_GALVAN,F,06-Mar-26,CARAHUNCO,EMILYSMITH@GMAIL.COM +579,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,16-Oct-20,DIANE_LARSEN,F,05-Jan-98,GENERAL_SAN_MARTIN,FMONTGOMERY@HOTMAIL.COM +580,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,16-Oct-20,TROY_AVERY,M,07-Dec-96,GOYENA,OMCINTYRE@GMAIL.COM +581,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,16-Oct-20,CRYSTAL_CAMPOS,F,22-Aug-18,ABALO,WEBSTERDON@GMAIL.COM +582,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,16-Oct-20,SHANNON_ROBERTSON,F,14-Dec-55,ARROYO_SANTA_MARIA,DEANNAHERNANDEZ@HOTMAIL.COM +583,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,16-Oct-20,KIMBERLY_HUFF,F,05-Jun-43,CORA,INEAL@GMAIL.COM +584,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,16-Oct-20,CHAD_WHITE,M,24-Jun-65,RICARDO_LAVALLE,SEAN80@YAHOO.COM +585,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,16-Oct-20,RICHARD_JONES,M,23-Jul-43,FLAMENCO,DENISE94@HOTMAIL.COM +586,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,16-Oct-20,JONATHAN_KIM,M,02-Aug-78,CENTELLA,DNIELSEN@GMAIL.COM +587,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,16-Oct-20,ANTHONY_BENTON,M,08-May-50,FUNKE,AARON46@YAHOO.COM +588,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,16-Oct-20,CAROL_DOUGLAS,F,14-Oct-07,DOCK_SUD,CRODRIGUEZ@HOTMAIL.COM +589,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,16-Oct-20,KAYLA_DIXON,F,22-Aug-66,AGUADA_CHACAY_CO,RYANWILLIAMS@YAHOO.COM +590,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,16-Oct-20,JOSEPH_GARDNER,M,31-May-89,13_DE_ENERO,HMARTIN@YAHOO.COM +591,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,17-Oct-20,GEORGE_BARRERA,M,09-Dec-92,CASBAS,FHARRIS@HOTMAIL.COM +592,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,17-Oct-20,JARED_ROLLINS,M,11-Oct-94,ACHICO,HOUSTONALEXANDER@GMAIL.COM 
+593,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,17-Oct-20,NICHOLAS_JOHNSON,M,21-Oct-23,LA_BLANQUEADA,JONATHAN79@HOTMAIL.COM +594,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,17-Oct-20,REGINA_THOMAS,F,21-Nov-84,VILLA_BALLESTER,ROBIN52@YAHOO.COM +595,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,17-Oct-20,DALTON_ROMAN,M,23-Nov-83,ARROYO_CORTO,REBECCAROSS@HOTMAIL.COM +596,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,17-Oct-20,CHRISTOPHER_HARPER,M,26-Feb-44,CAMPO_DEL_NORTE_AMERICANO,ROBERTCALLAHAN@HOTMAIL.COM +597,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,17-Oct-20,JAMES_WERNER,M,21-Feb-08,AGUADA,LEVINELAURIE@HOTMAIL.COM +598,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,17-Oct-20,BRYAN_KING,M,08-Mar-32,LOMAS_DE_ZAMORA,CHARLESBAILEY@HOTMAIL.COM +599,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,17-Oct-20,LISA_BELL,F,10-Jun-04,LA_TORRECITA,SARA34@GMAIL.COM +600,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,18-Oct-20,CONNIE_MOORE,F,14-Dec-02,EDMUNDO_PERKINS,WILLIAMSBRIAN@HOTMAIL.COM +601,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,18-Oct-20,EDWARD_GOMEZ,M,28-Jun-08,ALDEA_MARIA_LUISA,BROWNSERGIO@YAHOO.COM +602,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,18-Oct-20,JOSEPH_DAVIS,M,13-Apr-55,28_DE_NOVIEMBRE,MICHELE61@GMAIL.COM +603,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,18-Oct-20,JESSE_GRAHAM,M,01-Apr-05,ALTO_VERDE,DAVIDCAROLYN@YAHOO.COM +604,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,18-Oct-20,BRIAN_GILLESPIE,M,10-Nov-72,ADELA_CORTI,MICHAELHAMPTON@GMAIL.COM +605,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,18-Oct-20,CATHERINE_MORENO,F,13-Sep-72,COSTA_GRANDE,JOHNSONJEFFREY@YAHOO.COM +606,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,18-Oct-20,VICTORIA_SMITH,F,03-Aug-52,COLONIA_ESCRIBANO,FARMERCHERYL@YAHOO.COM +607,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,18-Oct-20,DESTINY_POWERS,F,04-Sep-06,BARRIO_GRAL_JOSE_DE_SAN_MARTIN,HICKSDENISE@YAHOO.COM 
+608,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,18-Oct-20,DEBRA_COHEN,F,10-Mar-64,CAMPO_CALVO,MERRITTTAMARA@HOTMAIL.COM +609,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,18-Oct-20,MICHELLE_CROSS,F,08-Aug-21,IFRAN,TCLARKE@HOTMAIL.COM +610,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,18-Oct-20,PAUL_CANNON,M,15-Jan-26,ERNESTINA,CODYDECKER@GMAIL.COM +611,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,18-Oct-20,MAUREEN_NGUYEN,F,11-Dec-70,EL_BOMBERO,FWILLIAMS@YAHOO.COM +612,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,18-Oct-20,DAWN_FREEMAN,F,15-Mar-47,FAVELLI,FLAWSON@YAHOO.COM +613,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,18-Oct-20,DANIEL_HOLLOWAY,M,14-Jul-56,HALE,ROBERTMENDEZ@GMAIL.COM +614,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,19-Oct-20,TAMMY_SCHMITT,F,18-Jun-27,LAS_PALMAS,ROY73@HOTMAIL.COM +615,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,19-Oct-20,MISTY_SNOW,F,28-Jan-86,BAHIA_CREEK,QERICKSON@HOTMAIL.COM +616,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,19-Oct-20,ERIC_HOWARD,M,07-Jul-93,EL_PAMPERO,IFRAZIER@YAHOO.COM +617,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,19-Oct-20,CAMERON_MITCHELL,M,25-Jan-91,ARROYO_DULCE,SJONES@HOTMAIL.COM +618,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,19-Oct-20,JAMES_PETERSON,M,12-Aug-12,ALDEA_SAN_ANTONIO,CPETERSON@HOTMAIL.COM +619,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,19-Oct-20,DEREK_SMITH,M,15-Jul-24,CAMPO_LA_NENA,WPERKINS@HOTMAIL.COM +620,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,19-Oct-20,STEPHEN_PONCE,M,29-Aug-06,DEFERRARI,MARIAWILSON@GMAIL.COM +621,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,19-Oct-20,RAYMOND_LEWIS,M,10-Feb-44,CHALLACO,MICHAELROBBINS@YAHOO.COM +622,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,19-Oct-20,AMY_LOPEZ,F,19-Nov-30,VILLA_BALLESTER,ORIVERS@GMAIL.COM 
+623,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,19-Oct-20,AMY_HARPER,F,18-Feb-62,LA_CHIRLANDIA,JEFFREYLEWIS@GMAIL.COM +624,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,19-Oct-20,MEAGAN_COOPER,F,09-Sep-25,DESPEÑADEROS,MGARCIA@HOTMAIL.COM +625,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,19-Oct-20,TODD_HARRELL,M,17-Apr-59,GUILLERMO_E_HUDSON,KELLYPROCTOR@YAHOO.COM +626,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,19-Oct-20,AMY_OLIVER,F,02-May-92,CAMPAMENTO_SOL,CONRADSHAWN@GMAIL.COM +627,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,19-Oct-20,ALEXANDRA_SAUNDERS,F,23-Jun-50,ARBOL_SOLO,THERESASHARP@GMAIL.COM +628,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,19-Oct-20,ADAM_SANDERS,M,10-Oct-49,LIBANO,TAYLORKELLER@YAHOO.COM +629,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,20-Oct-20,WILLIAM_KEMP,M,21-Feb-69,AYUI_PARADA,KENNEDYJOSEPH@GMAIL.COM +630,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,20-Oct-20,ELIZABETH_GREER,F,06-Dec-99,AGUADA_ALEGRE,RICEMELISSA@GMAIL.COM +631,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,20-Oct-20,CHARLENE_CUNNINGHAM,F,02-Oct-48,CAÑADA_LA_NEGRA,HENRYLONNIE@YAHOO.COM +632,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,20-Oct-20,MICHELLE_MEYER,F,17-Jul-09,AGUANGO,MARISAJOHNSON@YAHOO.COM +633,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,20-Oct-20,MICHAEL_CARRILLO,M,06-Feb-28,CORRENTOSO,MTHOMAS@GMAIL.COM +634,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,20-Oct-20,JAMES_MENDOZA,M,30-Jul-53,SAN_GERONIMO,KIMBERLY73@HOTMAIL.COM +635,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,20-Oct-20,WILLIAM_ADKINS,M,20-Jul-14,IRENEO_PORTELA,MATTHEW76@HOTMAIL.COM +636,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,20-Oct-20,WILLIAM_WHITE,M,09-Nov-63,BAJO_DE_RACO,STEPHANIE57@HOTMAIL.COM +637,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,20-Oct-20,DEBBIE_CHRISTIAN,F,12-Feb-50,ATUEL_SUD,PSMALL@YAHOO.COM 
+638,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,20-Oct-20,REGINALD_ALVARADO,M,10-May-03,CASTELAR,HUDSONJESSICA@YAHOO.COM +639,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,20-Oct-20,ALBERT_MITCHELL,M,18-Nov-59,CAMET,OLIVIA25@YAHOO.COM +640,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,20-Oct-20,ELIZABETH_MADDOX,F,31-Jul-57,EL_RETIRO,BWILLIAMS@YAHOO.COM +641,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,20-Oct-20,SHERRI_YU,F,27-Aug-13,LOS_ANTIGUOS,ROBERTARIAS@YAHOO.COM +642,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,20-Oct-20,JOE_ROGERS,M,07-Aug-83,MANUEL_B_GONNET,JOHNSONMICHELE@HOTMAIL.COM +643,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,21-Oct-20,JANE_MCBRIDE,F,07-Jun-53,CATARATAS_DEL_IGUAZU,NATASHAGATES@YAHOO.COM +644,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,21-Oct-20,AARON_MOORE,M,16-Nov-08,EL_PORVENIR,NICOLE59@YAHOO.COM +645,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,21-Oct-20,JESSICA_FLORES,F,07-Jul-14,COLONIA_BOMBAL_Y_TABANERA,JACKSONLINDSEY@HOTMAIL.COM +646,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,21-Oct-20,ALYSSA_MORALES,F,15-Dec-09,LA_BLANQUEADA,ZCOCHRAN@YAHOO.COM +647,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,21-Oct-20,ROBERTA_PETERSON,F,18-Jul-91,ADELA,PRICEELIZABETH@GMAIL.COM +648,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,21-Oct-20,SHAWN_SHEPPARD,M,01-Nov-77,BALDE_AHUMADA,BRYAN94@YAHOO.COM +649,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,21-Oct-20,JAMES_JACKSON,M,24-Feb-44,CALDERON,WNELSON@HOTMAIL.COM +650,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,21-Oct-20,BRENDA_MCGRATH,F,26-Jan-15,LOS_MOLINOS,OMOYER@YAHOO.COM +651,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,21-Oct-20,DAWN_MARTIN,F,30-May-75,BAHIA_BUSTAMANTE,FOXALEXANDRA@HOTMAIL.COM +652,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,21-Oct-20,BIANCA_FREEMAN,F,06-May-86,CANAL_15_CERRO_DE_LA_GLORIA,SAUNDERSDAVID@HOTMAIL.COM 
+653,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,21-Oct-20,WILLIAM_RICHARDSON,M,16-Dec-27,ALPACHIRI,BROWNTERESA@HOTMAIL.COM +654,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,21-Oct-20,RODNEY_MOORE,M,28-Dec-98,ANGEL_GALLARDO,ERICAROBINSON@HOTMAIL.COM +655,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,21-Oct-20,BRUCE_LANDRY,M,01-Dec-64,ARROYO_SALADO,ODAVIS@HOTMAIL.COM +656,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,21-Oct-20,MARIA_ROJAS,F,10-Aug-66,CAMPO_LAS_PUERTAS,SUEJONES@HOTMAIL.COM +657,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,21-Oct-20,GEORGE_ARMSTRONG,M,13-Oct-73,DE_BRUYN,TARAMARTINEZ@GMAIL.COM +658,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,21-Oct-20,ROBERT_AVERY,M,06-Jan-43,ARROYO,LEWISMARY@GMAIL.COM +659,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,21-Oct-20,DANIEL_RODRIGUEZ,M,03-Sep-91,COLONIA_LOS_BOSQUES,FLORESJOSEPH@HOTMAIL.COM +660,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,22-Oct-20,VANESSA_VAUGHN,F,30-Jul-14,AGUADITAS,LWOLFE@HOTMAIL.COM +661,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,22-Oct-20,JAMIE_WILSON,F,15-Jun-90,HUASA_PAMPA_NORTE,NELSONBRIAN@YAHOO.COM +662,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,22-Oct-20,ALICIA_NEWMAN,F,02-May-20,LA_SALADA,KELLEYAARON@GMAIL.COM +663,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,22-Oct-20,DIANE_SNYDER,F,03-Apr-29,COLONIA_SANTA_TERESA,XHAYDEN@HOTMAIL.COM +664,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,22-Oct-20,MICHAEL_EDWARDS,M,24-Apr-78,ALBERTI,BMAY@GMAIL.COM +665,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,22-Oct-20,ANTHONY_PATEL,M,04-Aug-40,ALEGRIA,KELLYMORALES@GMAIL.COM +666,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,22-Oct-20,JEFFREY_LEWIS,M,30-Jun-33,BARROS_PAZOS,CHRISTOPHER93@YAHOO.COM +667,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,23-Oct-20,LISA_RYAN,F,11-Jun-10,BALDE_DE_LEYES,SARAH60@GMAIL.COM 
+668,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,23-Oct-20,JOSE_HERMAN,M,16-Oct-80,AGUA_DE_DIONISIO,RICHARD73@HOTMAIL.COM +669,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,23-Oct-20,DEBORAH_TATE,F,19-Jun-85,ANTONIO_DE_LOS_HEROS,MORGAN62@YAHOO.COM +670,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,23-Oct-20,JESSICA_LAMBERT,F,08-Nov-29,BADANO,MEGANWEBER@YAHOO.COM +671,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,23-Oct-20,DANIEL_MEZA,M,29-Aug-65,AGUAS_CALIENTES,ZALLEN@GMAIL.COM +672,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,23-Oct-20,PAMELA_ROBLES,F,26-Jan-96,ALIJILAN,WILLIAMBARRY@HOTMAIL.COM +673,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,23-Oct-20,BRIAN_HOWARD,M,19-Oct-02,CAPIOVI,JACOB99@HOTMAIL.COM +674,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,23-Oct-20,SUSAN_RIVERA,F,26-Feb-23,DEFERRARI,TIMOTHY67@YAHOO.COM +675,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,23-Oct-20,BRETT_ROY,M,05-Feb-45,AGUA_CERCADA,MADISONKELLY@HOTMAIL.COM +676,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,23-Oct-20,SHAWN_PARKS,M,26-May-24,ALMACEN_EL_DESCANSO,RANDALL72@YAHOO.COM +677,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,23-Oct-20,KATRINA_MITCHELL,F,05-Sep-94,CAILOMUTA,DGIBSON@YAHOO.COM +678,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,23-Oct-20,JOHN_KAISER,M,29-Jun-25,ALTO_BLANCO,LISA40@YAHOO.COM +679,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,23-Oct-20,ERIC_FITZPATRICK,M,23-Oct-17,AMENABAR,HARRISONCYNTHIA@GMAIL.COM +680,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,24-Oct-20,MELISSA_GLOVER,F,12-Jan-18,ADELA,THOMAS45@HOTMAIL.COM +681,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,24-Oct-20,RONALD_CASE,M,24-Mar-27,ALEGRE,GRAHAMJAMES@YAHOO.COM +682,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,24-Oct-20,JUDY_MARTINEZ,F,31-Aug-73,CAMPO_DE_LOS_TOROS,PATRICIA33@YAHOO.COM 
+683,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,24-Oct-20,ROSE_FRAZIER,F,13-Sep-65,ASCENCION,IJOHNSON@YAHOO.COM +684,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,24-Oct-20,GREGORY_MORRIS,M,20-Feb-97,ALPACHIRI,MILLERJOSHUA@YAHOO.COM +685,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,24-Oct-20,KEVIN_ATKINSON,M,14-Feb-11,BERISSO,CGONZALES@HOTMAIL.COM +686,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,24-Oct-20,MISTY_BARBER,F,17-Jun-97,COLONIA_BELLA_VISTA,ANTHONYDENNIS@GMAIL.COM +687,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,24-Oct-20,NATHAN_SCOTT,M,17-Jul-96,2_DE_MAYO,NROSE@HOTMAIL.COM +688,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,24-Oct-20,SHANE_KELLY,M,19-Aug-32,FAVELLI,CSANCHEZ@YAHOO.COM +689,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,24-Oct-20,CARLOS_EVANS,M,12-Jun-11,ESTRADA,DODSONTERRI@YAHOO.COM +690,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,24-Oct-20,STEVEN_BERRY,M,11-Mar-09,ALMIRANTE_IRIZAR,FERRELLJASON@HOTMAIL.COM +691,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,24-Oct-20,MARY_TORRES,F,04-Apr-94,RAFAEL_CALZADA,GRUIZ@GMAIL.COM +692,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,24-Oct-20,DANIELLE_RODRIGUEZ,F,17-Aug-72,BAÑOS_DE_LA_LAJA,WALKERDANA@YAHOO.COM +693,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,24-Oct-20,MALLORY_MARTINEZ,F,06-Jan-36,BARKER,DANA01@HOTMAIL.COM +694,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,25-Oct-20,AARON_RIOS,M,14-Dec-58,ALVAREZ,CHAVEZAMANDA@GMAIL.COM +695,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,25-Oct-20,SCOTT_MAYS,M,09-Nov-28,ALTA_ITALIA,MEREDITHPENA@YAHOO.COM +696,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,25-Oct-20,MICHELE_CAIN,F,16-Jul-07,CHIVILCOY,GRACE89@GMAIL.COM +697,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,25-Oct-20,RONALD_WILLIAMS,M,26-Jun-84,ALTO_DE_LAS_ARAÑAS,GERALDSANCHEZ@HOTMAIL.COM 
+698,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,25-Oct-20,MISTY_DAVIS,F,27-Feb-29,KILOMETRO_47,EMILYLEE@HOTMAIL.COM +699,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,25-Oct-20,ROBERT_BOYD,M,14-Apr-11,BARRIO_FERRI,SANDRASANCHEZ@HOTMAIL.COM +700,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,25-Oct-20,RAYMOND_HUBBARD,M,15-Jul-62,COLONIA_MATILDE,CHARLESRAMIREZ@HOTMAIL.COM +701,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,25-Oct-20,DAVID_WOODS,M,20-May-73,ISLA_GRAN_MALVINA,FRAMIREZ@GMAIL.COM +702,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,25-Oct-20,LISA_OROZCO,F,23-Oct-54,ARMINDA,ZHESTER@GMAIL.COM +703,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,25-Oct-20,MEGAN_WARD,F,14-Jan-15,EL_CARRETERO,CBRANCH@HOTMAIL.COM +704,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,25-Oct-20,STEPHANIE_HOOVER,F,04-Sep-06,ARROYO_BURGOS,FRANK77@YAHOO.COM +705,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,25-Oct-20,JONATHAN_CHUNG,M,15-Mar-49,AGUSTIN_MOSCONI,DENISE87@YAHOO.COM +706,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,25-Oct-20,KEVIN_ALI,M,07-Jul-51,AMANA,PHILLIP59@GMAIL.COM +707,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,25-Oct-20,GARY_WRIGHT,M,27-Oct-79,CASABLANCA,SSTEWART@YAHOO.COM +708,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,25-Oct-20,DAWN_WARNER,F,18-Apr-27,CHEROGUITA,CURTISCHERRY@YAHOO.COM +709,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,25-Oct-20,DAVID_POPE,M,08-Dec-13,LA_PRIMAVERA,CHALL@GMAIL.COM +710,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,26-Oct-20,EILEEN_FORD,F,18-May-13,COLONIA_BOMBAL,SANDERSANDREA@GMAIL.COM +711,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,26-Oct-20,KAREN_BROWN,F,06-Jul-45,17_DE_AGOSTO,RMASSEY@GMAIL.COM +712,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,26-Oct-20,CYNTHIA_DAVENPORT,F,26-Jul-64,ALZAGA,DAVIDMALONE@YAHOO.COM 
+713,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,26-Oct-20,MR._ERIC_JACKSON_IV,M,17-Aug-17,BERNAL_ESTE,KAREN56@YAHOO.COM +714,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,27-Oct-20,SARA_HOLLAND,F,29-Dec-18,COSTA_DEL_ESTE,JEFFREYFITZGERALD@GMAIL.COM +715,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,27-Oct-20,JAVIER_BURGESS,M,15-Jan-14,COLONIA_PUJOL,JOSHUARICHARDSON@YAHOO.COM +716,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,27-Oct-20,CHAD_FOX,M,15-Jun-47,ALONGO,JAMESMILLER@YAHOO.COM +717,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,27-Oct-20,CARL_PRICE,M,22-Aug-80,SALDUNGARAY,ANDERSONMICHAEL@HOTMAIL.COM +718,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,27-Oct-20,SARAH_EDWARDS,F,21-Mar-55,AGUADITA,JOHNROSE@GMAIL.COM +719,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,27-Oct-20,MIRANDA_RILEY,F,02-Sep-07,BARRIO_VILLA_SALADILLO,LNASH@GMAIL.COM +720,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,27-Oct-20,SCOTT_HICKS,M,16-May-66,CAMPO_QUIRNO,CRYSTAL67@GMAIL.COM +721,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,27-Oct-20,BRIAN_LOPEZ,M,06-Apr-22,AGUA_AMARGA,MIGUEL54@GMAIL.COM +722,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,27-Oct-20,SAMANTHA_STONE,F,30-Aug-87,AERO_CLUB_CANAL,BSIMMONS@YAHOO.COM +723,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,27-Oct-20,JASON_SPARKS,M,02-Apr-13,EL_PIMPOLLO,TAMMY47@HOTMAIL.COM +724,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,27-Oct-20,PHYLLIS_GONZALEZ,F,12-Mar-89,CAMPO_ARISTIMUÑO,TIMOTHY26@GMAIL.COM +725,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,27-Oct-20,CHRISTIAN_GARCIA,M,21-Oct-19,COPACABANA,ELIZABETHSAWYER@HOTMAIL.COM +726,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,27-Oct-20,DAVID_BASS,M,07-May-14,ALFALAD,SCOTTBENNETT@GMAIL.COM +727,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,27-Oct-20,JACK_MARTIN,M,25-Sep-13,CIUDAD_MADERO,MICHAELADAMS@YAHOO.COM 
+728,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,28-Oct-20,JOSHUA_HUDSON,M,21-Mar-18,ARROYO_DEL_PESCADO,ERICWILLIAMS@GMAIL.COM +729,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,28-Oct-20,TAMMY_THOMPSON,F,19-Jul-67,LAS_TONINAS,MKENNEDY@GMAIL.COM +730,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,28-Oct-20,DR._LANCE_MAYO,M,29-Sep-75,6_DE_SEPTIEMBRE,UKING@YAHOO.COM +731,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,28-Oct-20,MATTHEW_HOFFMAN,M,14-May-14,CASALINS,CLEONARD@HOTMAIL.COM +732,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,28-Oct-20,MICHAEL_HAMILTON,M,06-Jun-51,AMERICA_UNIDA,ROBERTSLISA@GMAIL.COM +733,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,28-Oct-20,ALYSSA_MARTINEZ,F,08-Oct-57,EREZCANO,JULIE21@YAHOO.COM +734,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,28-Oct-20,MRS._ASHLEY_MILLER,F,14-Jul-91,CORONEL_ISLEÑOS,WJIMENEZ@HOTMAIL.COM +735,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,28-Oct-20,KRISTEN_ARIAS_DDS,F,05-Oct-36,ACASSUSO,NICHOLASSHEPHERD@GMAIL.COM +736,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,28-Oct-20,TAMARA_KELLEY,F,29-Oct-80,BAÑADO_VERDE,CATHERINEROBERSON@HOTMAIL.COM +737,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,28-Oct-20,GABRIELLE_WOOD,F,08-May-42,ISLA_GRAN_MALVINA,KMORRIS@GMAIL.COM +738,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,28-Oct-20,ANDREA_KIRBY,F,17-Nov-63,10_DE_MAYO,KRISTIE75@GMAIL.COM +739,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,28-Oct-20,EMMA_WILLIAMS,F,13-Jul-48,CARMEN,RHARVEY@GMAIL.COM +740,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,29-Oct-20,JESSICA_WALSH,F,08-May-84,PIAMONTE,SUSAN41@GMAIL.COM +741,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,29-Oct-20,DERRICK_MILLER,M,23-Oct-18,BATELITO,PREED@GMAIL.COM +742,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,29-Oct-20,VINCENT_TRUJILLO,M,23-Mar-10,CALDERON,DOUGLAS08@YAHOO.COM 
+743,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,29-Oct-20,KENNETH_PARK,M,11-Jul-59,COLONIA_CELINA,AMANDA28@GMAIL.COM +744,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,29-Oct-20,BRIDGET_GARCIA,F,02-Jul-54,ACEILAN,JGOMEZ@HOTMAIL.COM +745,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,29-Oct-20,CYNTHIA_PEREZ,F,10-Apr-26,GOBERNADOR_CRESPO,JARED06@GMAIL.COM +746,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,29-Oct-20,MICHELLE_PARKS,F,01-Nov-04,ALEGRIA,WSUTTON@YAHOO.COM +747,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,29-Oct-20,MRS._JODI_LAMBERT_DVM,F,22-Dec-60,BELLA_VISTA,FPAUL@YAHOO.COM +748,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,29-Oct-20,LISA_SNYDER,F,31-Jul-21,AGUA_COLORADA,COREY03@HOTMAIL.COM +749,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,29-Oct-20,KAREN_GORDON,F,29-Nov-99,COLONIA_SANTA_ROSA,ROBERTTHOMAS@HOTMAIL.COM +750,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,29-Oct-20,ANDREW_CLARK,M,24-Jun-19,LA_TORRECITA,GRAHAMJUSTIN@YAHOO.COM +751,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,29-Oct-20,BRIAN_BYRD,M,17-Jul-21,ARROYO_DE_LA_CRUZ,NELSONSANDRA@HOTMAIL.COM +752,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,29-Oct-20,TAYLOR_CHAVEZ,F,24-Dec-17,ALTO_LAS_LECHUZAS,HANNAHPETERSON@YAHOO.COM +753,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,29-Oct-20,DAWN_GOOD,F,10-Jun-21,CIUDAD_EVITA,VINCENTKATHY@HOTMAIL.COM +754,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,29-Oct-20,ROBERT_BROWN,M,06-Sep-81,AGUAS_CALIENTES,SHELTONBOBBY@HOTMAIL.COM +755,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,29-Oct-20,KENNETH_ROBINSON,M,01-Sep-17,COLONIA_RIVAS,UCOCHRAN@YAHOO.COM +756,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,29-Oct-20,APRIL_KING,F,05-Sep-10,COLONIA_BARON_HIRSCH,KATHERINE33@GMAIL.COM +757,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,30-Oct-20,NATHAN_MARTIN,M,24-Nov-90,ALGARROBITOS_1RO,HANSENBRYAN@HOTMAIL.COM 
+758,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,30-Oct-20,ANGELA_BISHOP,F,21-May-27,2_DE_JULIO,NICHOLAS82@HOTMAIL.COM +759,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,30-Oct-20,ASHLEY_WRIGHT,F,25-Jan-59,CAMPO_HORQUESCO,EBRAY@YAHOO.COM +760,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,30-Oct-20,CHARLES_MASON,M,03-Apr-46,BERNAL_ESTE,CSNYDER@YAHOO.COM +761,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,30-Oct-20,ERIC_JOHNSON,M,01-Aug-98,JOSE_LEON_SUAREZ,JANET67@GMAIL.COM +762,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,30-Oct-20,JAMES_NAVARRO_DVM,M,30-Jul-30,CARLOS_CASARES,ANGELA49@YAHOO.COM +763,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,30-Oct-20,KAREN_OBRIEN,F,01-Jul-35,ACARAGUA,TRACYPARK@YAHOO.COM +764,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,30-Oct-20,CHRISTOPHER_GONZALES,M,19-May-68,ANTONIO_DE_LOS_HEROS,JOSE32@YAHOO.COM +765,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,30-Oct-20,CONNOR_GOLDEN,M,26-Jul-88,ARANGUREN,LHINES@YAHOO.COM +766,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,30-Oct-20,BOBBY_WANG,M,30-Oct-01,EMPALME_SAN_CARLOS,ROMANDANIEL@YAHOO.COM +767,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,30-Oct-20,THOMAS_SANCHEZ,M,07-May-80,ADOLFO_VAN_PRAET,TODD46@HOTMAIL.COM +768,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,30-Oct-20,CYNTHIA_NICHOLS,F,06-Jan-18,CORRENTOSO,CERICKSON@HOTMAIL.COM +769,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,30-Oct-20,KEVIN_RAMIREZ,M,16-Jan-06,BLANCA_GRANDE,AGONZALES@YAHOO.COM +770,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,30-Oct-20,KATHRYN_FIGUEROA,F,09-Feb-01,AMBERES,ROY52@GMAIL.COM +771,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,30-Oct-20,STEPHEN_ROSS,M,26-Feb-40,INGENIERO_BALBIN,SARAHSULLIVAN@YAHOO.COM +772,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,30-Oct-20,MICHELLE_PATTERSON,F,10-Feb-52,AGUA_RICA,CROSALES@HOTMAIL.COM 
+773,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,30-Oct-20,DEBRA_FLORES,F,26-Nov-15,COLONIA_ZAMBUNGO,SANDRALARSON@YAHOO.COM +774,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,30-Oct-20,HEATHER_CHAPMAN,F,23-Jan-02,COLONIA_LEIVA,ANTHONY73@YAHOO.COM +775,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,31-Oct-20,SARA_DAVIS,F,03-Apr-82,PALANTELEN,BARBARALOPEZ@GMAIL.COM +776,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,31-Oct-20,VALERIE_JACKSON,F,21-Nov-12,ESTACION_LAGO_EPECUEN,ALBERT72@YAHOO.COM +777,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,31-Oct-20,JOHN_ROGERS,M,05-Jul-00,COLONIA_EL_POTRERO,JESSICAHARRIS@GMAIL.COM +778,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,31-Oct-20,ROBERT_HUTCHINSON,M,02-Oct-78,BOCAS,HAROLD52@GMAIL.COM +779,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,31-Oct-20,LISA_LEWIS,F,08-Jan-04,CAMPO_ANDINO,MARTINEZDIANE@GMAIL.COM +780,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,31-Oct-20,APRIL_DAVIS,F,19-Jun-09,RECALDE,JOHNSONMELISSA@HOTMAIL.COM +781,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,31-Oct-20,KEVIN_ELLISON,M,02-Mar-49,ANDRADE,ILEWIS@HOTMAIL.COM +782,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,31-Oct-20,KATHLEEN_SHARP,F,11-Apr-68,AGUADITAS,GATESNANCY@GMAIL.COM +783,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,31-Oct-20,MIGUEL_WOLF,M,02-Dec-41,CORTINES,EBLANCHARD@GMAIL.COM +784,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,31-Oct-20,ELIZABETH_LAWRENCE,F,31-Mar-85,CHACRAS_VIEJAS,PCLARK@HOTMAIL.COM +785,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,31-Oct-20,JERRY_HORTON,M,15-Jan-65,COLONIA_MENDEZ_BAR,TROY11@GMAIL.COM +786,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,31-Oct-20,DEAN_WARD,M,03-Oct-76,EL_CENIZO,QRAMIREZ@GMAIL.COM 
+787,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,31-Oct-20,ROBERT_HENDERSON,M,16-Apr-25,ALTO_DE_LEIVA,BROOKEROBBINS@GMAIL.COM +788,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,01-Nov-20,SARAH_JONES,F,18-Jul-39,CONDARCO,WATSONANGELA@GMAIL.COM +789,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Nov-20,WILLIAM_GOMEZ,M,16-Mar-97,EMPALME_VILLA_CONSTITUCION,AMANDA90@YAHOO.COM +790,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,01-Nov-20,BRIANA_MORGAN,F,12-Mar-21,PONTAUT,SPENCEPETER@GMAIL.COM +791,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,01-Nov-20,JEFFREY_BENDER,M,12-Nov-17,COLONIA_LA_YERBA,CHRISTOPHER36@YAHOO.COM +792,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,01-Nov-20,APRIL_HAWKINS_MD,F,28-Oct-67,BORDENAVE,TUCKERKRISTIN@YAHOO.COM +793,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,01-Nov-20,VICTOR_GRAY,M,16-Apr-71,CALFUCURA,ELLISJOHNNY@HOTMAIL.COM +794,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,01-Nov-20,JAMES_DAVIS,M,28-Dec-97,ARTURO_ALMARAZ,AARONJONES@GMAIL.COM +795,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,01-Nov-20,DAKOTA_WANG,M,25-May-57,CAÑADA_SECA,CHRISTOPHERHOGAN@HOTMAIL.COM +796,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,01-Nov-20,SEAN_LAMBERT,M,21-Jul-62,ESTANCIA_SANTA_CATALINA,OBROWN@YAHOO.COM +797,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,01-Nov-20,MARTIN_SHERMAN,M,07-Jan-62,LA_VITICOLA,JHORN@GMAIL.COM +798,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Nov-20,MEGAN_ANDERSON,F,04-Oct-78,EL_GUALICHO,THOMPSONAPRIL@HOTMAIL.COM +799,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,01-Nov-20,DAVID_MURRAY,M,13-Feb-99,COLONIA_DELFINO,LISACASTRO@YAHOO.COM +800,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,01-Nov-20,TAMMY_RODRIGUEZ,F,24-Sep-96,BATELITO,WESTALEXIS@YAHOO.COM +801,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,02-Nov-20,PATRICIA_BROWN,F,11-Nov-96,LOS_LAURELES,EROBERTS@YAHOO.COM 
+802,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,02-Nov-20,ADAM_CLARK,M,22-Sep-89,CHANILAO,YMILLS@GMAIL.COM +803,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,02-Nov-20,GAIL_PALMER,F,14-Dec-49,SAN_JOSE_DE_PIEDRA_BLANCA,GLANE@YAHOO.COM +804,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,02-Nov-20,KATHLEEN_ANDERSON,F,26-Dec-95,ALTO_CALILEGUA,WILCOXCAITLIN@YAHOO.COM +805,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,02-Nov-20,JACKIE_TAYLOR,F,20-Apr-41,KILOMETRO_208,PATRICIA76@HOTMAIL.COM +806,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,02-Nov-20,MISS_MARY_GRANT,F,17-Mar-91,BONPLAND,IOWEN@GMAIL.COM +807,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,02-Nov-20,KATHERINE_ANDERSON,F,31-Jan-35,AMBAS_PUNTILLAS,OTHOMPSON@HOTMAIL.COM +808,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,02-Nov-20,JEREMY_MOORE,M,18-Nov-21,COLMAN,WVALDEZ@HOTMAIL.COM +809,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,02-Nov-20,STACY_SALAZAR,F,23-Apr-13,ESMERALDA,DARIUS52@GMAIL.COM +810,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,02-Nov-20,ERICA_SMITH,F,25-Sep-41,KILOMETRO_77,JOCELYN41@GMAIL.COM +811,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,02-Nov-20,DYLAN_DAVIS,M,16-Jun-32,COLONIA_BOMBAL_Y_TABANERA,ULYNCH@GMAIL.COM +812,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,02-Nov-20,MELODY_FOSTER,F,14-Oct-15,CUSHAMEN,DODSONMICHAEL@GMAIL.COM +813,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,03-Nov-20,CALEB_GARCIA,M,24-Jun-09,CAPILLA_GUADALUPE_NORTE,JUSTIN49@GMAIL.COM +814,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,03-Nov-20,BRANDON_LOPEZ,M,03-Jul-64,CAMPO_CHARO,JULIE33@HOTMAIL.COM +815,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,03-Nov-20,TIMOTHY_WEBSTER,M,14-Mar-24,CACHIYUYAL,NICOLE22@YAHOO.COM +816,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,03-Nov-20,MARGARET_SMITH,F,26-Dec-41,CAÑADA_DE_LAS_VACAS,DAVIESEDDIE@YAHOO.COM 
+817,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,03-Nov-20,SHANNON_WALSH,F,14-Aug-04,ASUNCION_MARIA,SBAKER@HOTMAIL.COM +818,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,03-Nov-20,BRIAN_MORGAN,M,02-Feb-04,ARROYO_HONDO,DANIELWEST@HOTMAIL.COM +819,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,03-Nov-20,KAREN_GRANT,F,23-Jul-04,AEROPUERTO_EZEIZA,VEVANS@YAHOO.COM +820,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,03-Nov-20,JESSICA_MUNOZ,F,04-Jul-29,AGUA_BLANCA,VICTORIA81@GMAIL.COM +821,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,03-Nov-20,CHAD_HOWELL,M,22-Jan-18,AGUAY,IPARSONS@YAHOO.COM +822,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,03-Nov-20,SARAH_PHILLIPS,F,24-Sep-16,CAMINERA_SAMBOROMBON,PATRICIA70@HOTMAIL.COM +823,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,03-Nov-20,CHRISTOPHER_HARTMAN,M,24-Feb-44,CAÑADITA,SHANE64@YAHOO.COM +824,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,03-Nov-20,LISA_HENSON,F,19-Jul-78,CARILO,CYNTHIAHOWARD@YAHOO.COM +825,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,03-Nov-20,PATRICK_WRIGHT,M,08-Feb-23,PORVENIR,PAULA78@GMAIL.COM +826,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,03-Nov-20,EDWARD_AGUIRRE,M,03-Dec-62,VILLA_SAUCE,ANN60@YAHOO.COM +827,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,03-Nov-20,MEGHAN_WALLACE,F,03-Mar-81,ARROYO_TOMAS,SCOTTTRAN@GMAIL.COM +828,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,04-Nov-20,ROBIN_CARDENAS,F,03-Aug-84,COLONIA_GOBERNADOR_AYALA,OMCDANIEL@YAHOO.COM +829,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,04-Nov-20,SARA_GARCIA,F,14-Aug-63,AZUL,FULLERROBERTA@YAHOO.COM +830,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,04-Nov-20,ERIKA_CARTER_MD,F,22-Jun-56,ALMIRANTE_BROWN,GLORIA98@YAHOO.COM +831,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,04-Nov-20,MELISSA_HILL,F,02-Jun-85,BATHURST_ESTACION,AKELLY@HOTMAIL.COM 
+832,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,04-Nov-20,ROBERT_BOOKER,M,17-Mar-53,EL_LENGUARAZ,JAMES26@HOTMAIL.COM +833,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,04-Nov-20,NICHOLAS_SMITH,M,25-Aug-45,BAGUAL,UFOSTER@YAHOO.COM +834,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,04-Nov-20,TIMOTHY_WILLIAMS,M,25-May-50,DE_BRUYN,CHALL@YAHOO.COM +835,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,04-Nov-20,JUSTIN_HAMPTON,M,08-Oct-60,CHUMBICHA,NICOLE88@HOTMAIL.COM +836,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,05-Nov-20,MELANIE_FRANCO,F,27-Nov-72,BATAVIA,MARSHALLAMBER@GMAIL.COM +837,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,05-Nov-20,KATHERINE_HAYNES,F,11-Aug-02,BLAS_DURAÑONA,DIAZBRETT@YAHOO.COM +838,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,05-Nov-20,RYAN_HILL,M,21-Sep-77,EL_MOLLE,DANIELANDREA@HOTMAIL.COM +839,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,05-Nov-20,NATHAN_MORRIS,M,22-May-47,COLONIA_HARDY,ELIZABETH81@HOTMAIL.COM +840,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,05-Nov-20,JEFFREY_HAHN,M,17-Jan-20,ANAHI,PATELMICHAEL@GMAIL.COM +841,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,05-Nov-20,LUIS_GUERRERO,M,22-Jan-14,EL_CIPRES,ANDREW54@GMAIL.COM +842,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,05-Nov-20,SCOTT_THOMAS,M,10-Nov-21,AGUADA_DE_LAS_TEJAS,AWEST@YAHOO.COM +843,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,05-Nov-20,JAMIE_BAXTER,F,10-Nov-11,EL_CIPRES,MARK37@GMAIL.COM +844,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,05-Nov-20,BRADLEY_ROBERTS,M,27-Aug-90,BARADERO,GMILLER@GMAIL.COM +845,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,05-Nov-20,SUZANNE_RAMSEY,F,26-Sep-42,COLONIA_ROCA,DMORENO@HOTMAIL.COM +846,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,05-Nov-20,JONATHAN_HART,M,14-Feb-13,CHAVARRIA,MALIK35@GMAIL.COM +847,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,05-Nov-20,COLLEEN_OLSON,F,03-Oct-09,COSTA_DEL_RIO_AZUL,DONNA21@HOTMAIL.COM 
+848,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,05-Nov-20,JENNIFER_SANCHEZ,F,03-Jan-42,ALPASINCHE,FOSTERGARY@GMAIL.COM +849,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,05-Nov-20,LAUREN_REESE,F,28-Apr-78,BERMUDEZ,CHRISTOPHER30@YAHOO.COM +850,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,06-Nov-20,KIMBERLY_BLEVINS,F,25-Mar-70,AMBROSIO_P_LEZICA,CHARLES51@YAHOO.COM +851,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,06-Nov-20,MELISSA_REED,F,17-May-62,LA_PUNTA,LAWRENCE13@HOTMAIL.COM +852,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,06-Nov-20,DANIEL_REED,M,15-Dec-52,CAMPO_LA_FLOR_LOS_RALOS,MILLERLORI@HOTMAIL.COM +853,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,06-Nov-20,VANESSA_CHAVEZ,F,17-Sep-95,ALEGRE,UHALEY@HOTMAIL.COM +854,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,06-Nov-20,ANNA_FUENTES,F,20-Feb-90,CAÑADON_LEON,XPARKER@GMAIL.COM +855,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,06-Nov-20,KATHY_WILLIAMS,F,19-Jan-27,AGUA_COLORADA,BROOKE36@HOTMAIL.COM +856,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,06-Nov-20,BRITTANY_HOWARD,F,23-Jan-09,PONTAUT,GREGORY44@YAHOO.COM +857,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,06-Nov-20,JENNIFER_SCHWARTZ,F,19-Jul-21,EL_PINO,HCAMACHO@HOTMAIL.COM +858,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,06-Nov-20,JESSICA_SCHNEIDER,F,01-Jul-23,ANCON,ROBERT40@YAHOO.COM +859,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,06-Nov-20,LEONARD_AVILA,M,28-Dec-12,ARAÑITA,RAMIREZCHRISTINA@HOTMAIL.COM +860,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,06-Nov-20,ROBERT_BROWN,M,11-Feb-09,ARROYO_TOMAS,ROBINPERKINS@YAHOO.COM +861,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,06-Nov-20,MALIK_SHEPHERD,M,30-Jan-11,COLONIA_BARON,CAROL37@HOTMAIL.COM +862,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,06-Nov-20,JACOB_DAVIS,M,08-Apr-03,COMANDANTE_LEAL,MARIAFERGUSON@HOTMAIL.COM 
+863,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,06-Nov-20,SARAH_HAMILTON,F,26-Nov-60,FUNKE,KAYLA99@GMAIL.COM +864,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,06-Nov-20,SANDRA_COOPER,F,05-Oct-03,CARAGUATAY,THALL@YAHOO.COM +865,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,06-Nov-20,JEREMY_SMITH_MD,M,06-Feb-73,ABRA_GUAZU,KATHERINE12@HOTMAIL.COM +866,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,06-Nov-20,JONATHAN_REYNOLDS,M,08-Nov-16,CUARTEL_VII,LARRYDAVIS@HOTMAIL.COM +867,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,07-Nov-20,RICARDO_MORRIS,M,20-Jan-62,BONIFACIO,QDUDLEY@HOTMAIL.COM +868,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,07-Nov-20,KIMBERLY_KANE,F,11-Feb-77,CHAMICAL,RACHELBROWN@HOTMAIL.COM +869,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,07-Nov-20,STEPHEN_BRADLEY,M,04-Aug-32,AVELLANEDA,MONROEANDREW@GMAIL.COM +870,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,07-Nov-20,CHRISTINA_PARKER,F,05-Jul-98,23_DE_AGOSTO,MICHAELWILLIAMS@GMAIL.COM +871,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,07-Nov-20,LORI_BISHOP,F,27-Feb-09,ARRASCAETA,MIRANDAJONES@HOTMAIL.COM +872,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,07-Nov-20,CARRIE_DAY,F,27-Apr-11,OCHENTA_Y_CUATRO,OTATE@YAHOO.COM +873,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,07-Nov-20,EMILY_COOKE,F,28-Aug-77,SIERRA_DE_LA_VENTANA,MEGAN15@YAHOO.COM +874,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,07-Nov-20,HERBERT_SULLIVAN,M,10-Mar-17,COSTA_BONITA_BALNEARIO,BILLYDIXON@HOTMAIL.COM +875,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,07-Nov-20,LOUIS_SMITH,M,24-Nov-33,COSTA_GRANDE,JORDANROGERS@GMAIL.COM +876,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,07-Nov-20,ANTHONY_THOMAS,M,24-Apr-19,ALMIRANTE_BROWN,SHARONFARLEY@YAHOO.COM +877,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,07-Nov-20,RHONDA_THOMPSON,F,30-Nov-08,MATHEU,DTERRELL@GMAIL.COM 
+878,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,07-Nov-20,BRANDON_OBRIEN,M,14-Aug-02,ATENCIO,CRYSTAL85@GMAIL.COM +879,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,08-Nov-20,BRANDI_FUENTES,F,15-Apr-01,AMERICA,QMOYER@HOTMAIL.COM +880,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,08-Nov-20,RONALD_BRAUN,M,16-Jul-33,BAJO_LA_CANCHA,PAIGEGOODWIN@HOTMAIL.COM +881,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,08-Nov-20,DAVID_STARK,M,30-Apr-28,COLONIA_ENSANCHE_SAUCE,ALEXANDERBULLOCK@YAHOO.COM +882,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,08-Nov-20,CLIFFORD_MILLS,M,06-Sep-14,FAVELLI,HEATHER68@HOTMAIL.COM +883,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,08-Nov-20,JARED_SIMPSON,M,29-May-92,AGUARA_CUA,DEREKNELSON@GMAIL.COM +884,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,08-Nov-20,DR._TIMOTHY_RIVERA,M,10-Mar-12,BONIFACIO,CODY30@GMAIL.COM +885,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,08-Nov-20,LESLIE_SCHNEIDER,F,23-Jul-48,ESTACION_CHRISTOPHERSEN,GREGORYCARLSON@HOTMAIL.COM +886,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,08-Nov-20,LISA_MARTINEZ,F,25-Aug-67,ABRA_EL_CANDADO,ROSE80@HOTMAIL.COM +887,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,08-Nov-20,ALYSSA_HERNANDEZ,F,20-Sep-11,ABRA,HUGHESJESSICA@GMAIL.COM +888,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,08-Nov-20,MRS._ASHLEY_MCCONNELL,F,06-Feb-76,11_DE_SEPTIEMBRE,RUTHCARTER@YAHOO.COM +889,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,08-Nov-20,COREY_WOOD,M,02-Jul-34,AGUARA_CUA,AUDREYBEST@YAHOO.COM +890,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,08-Nov-20,HEATHER_HOLMES,F,01-Nov-97,CARBOMETAL,JENNIFER37@HOTMAIL.COM +891,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,08-Nov-20,SARAH_CRUZ,F,19-Nov-49,ALDECON,RHONDACARLSON@HOTMAIL.COM +892,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,08-Nov-20,PAULA_JOHNS_DVM,F,17-Nov-01,SAN_PEDRO_DE_IRUYA,ZCALDWELL@YAHOO.COM 
+893,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,09-Nov-20,ANGELA_LEWIS,F,25-Aug-70,CAMPO_LA_RIVIERE,LHICKS@HOTMAIL.COM +894,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,09-Nov-20,SAMUEL_DAVIDSON,M,13-Apr-53,ARROYO_CANELON,SHAWNWHITE@HOTMAIL.COM +895,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,09-Nov-20,JASON_MCDONALD,M,09-Sep-14,LA_UNION,CODYGILMORE@HOTMAIL.COM +896,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,09-Nov-20,TRACY_CORTEZ,F,03-May-80,COLONIA_EL_AGUARA,KBARNES@YAHOO.COM +897,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,09-Nov-20,KARINA_HOGAN,F,02-Mar-22,DOS_HERMANAS,JASON43@YAHOO.COM +898,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,09-Nov-20,AMBER_RODRIGUEZ_MD,F,22-Jul-13,PUNTA_DE_LOS_LLANOS,YANGMARC@YAHOO.COM +899,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,09-Nov-20,KATHERINE_JOHNSON,F,10-Sep-05,BALNEARIO_LOS_ANGELES,PSOTO@YAHOO.COM +900,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,09-Nov-20,MELANIE_COX,F,02-Jul-67,ALGARROBAL,CASSANDRAMEYERS@HOTMAIL.COM +901,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,09-Nov-20,LAUREN_SHEPARD,F,02-Dec-14,EST_JAUREGUI_VA_FLANDRIA,BPETERSON@HOTMAIL.COM +902,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,09-Nov-20,JOANNA_SANCHEZ,F,12-Oct-88,APEADERO_QUIROGA,KMONTGOMERY@HOTMAIL.COM +903,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,09-Nov-20,RICHARD_NGUYEN,M,07-Jun-92,ALLEN,JOHNSONCHRISTINE@YAHOO.COM +904,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,09-Nov-20,EMILY_SCHMIDT,F,05-Mar-67,LA_DORITA,JENNIFER20@HOTMAIL.COM +905,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,09-Nov-20,NICOLE_CARTER,F,18-Feb-69,AARON_CASTELLANOS,JASONGREEN@YAHOO.COM +906,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,10-Nov-20,SHERRI_FRY,F,23-Jul-97,GARRO,WLAWSON@HOTMAIL.COM +907,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,10-Nov-20,SANDRA_NORMAN,F,18-Jan-09,HAEDO,KCOHEN@HOTMAIL.COM 
+908,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,10-Nov-20,SEAN_MENDOZA,M,21-May-13,CAMPO_CHARO,LARRY27@GMAIL.COM +909,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,10-Nov-20,AARON_PRICE,M,10-Mar-29,BME_BAVIO_GRAL_MANSILLA,BRANDTRENEE@GMAIL.COM +910,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,10-Nov-20,JOANN_TURNER,F,11-May-20,MERCADO_CENTRAL,SCOTTGENTRY@HOTMAIL.COM +911,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,10-Nov-20,MATTHEW_HOLT,M,17-Sep-19,NONOGASTA,BARBARA91@GMAIL.COM +912,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,10-Nov-20,SARAH_ZAMORA,F,04-May-08,LIBANO,HMERCER@YAHOO.COM +913,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,10-Nov-20,WILLIAM_CARROLL,M,09-May-66,BAJO_DE_LOS_HUESOS,NELSONBRIAN@HOTMAIL.COM +914,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,10-Nov-20,KIMBERLY_EDWARDS,F,14-Dec-10,CAÑADA_ROSQUIN,CRAIGCAMPOS@GMAIL.COM +915,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,10-Nov-20,DENISE_MILLER,F,19-Jul-72,BECCAR,MARCRUSSELL@HOTMAIL.COM +916,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,10-Nov-20,MATTHEW_ARMSTRONG,M,11-May-88,CANTERA_AGUIRRE,OCOHEN@HOTMAIL.COM +917,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,10-Nov-20,CHRISTOPHER_REED,M,20-Sep-60,SIERRA_DE_LA_VENTANA,BKERR@GMAIL.COM +918,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,10-Nov-20,MR._VINCENT_SANTOS,M,02-Apr-13,GIRODIAS,BPHILLIPS@HOTMAIL.COM +919,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,10-Nov-20,JILLIAN_BURKE,F,05-May-09,CHAPANAY,LISAARMSTRONG@GMAIL.COM +920,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,10-Nov-20,DAVID_SMITH,M,26-Feb-61,LA_ISABEL,AUTUMNPAYNE@HOTMAIL.COM +921,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,10-Nov-20,CHRISTINA_DAVIS,F,19-Jun-83,ARRECHEA,YGARRETT@HOTMAIL.COM +922,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,11-Nov-20,HALEY_FULLER,F,05-Aug-84,DON_TORCUATO,STONEALEXANDER@HOTMAIL.COM 
+923,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,11-Nov-20,CHRISTOPHER_KIRK,M,20-Apr-47,ALDEA_SAN_ANDRES,WEEKSROBERT@HOTMAIL.COM +924,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,11-Nov-20,ROBERT_WRIGHT,M,04-Dec-77,ARROYO_CASTILLO,RICHARD83@YAHOO.COM +925,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,11-Nov-20,DREW_DAVIS,M,24-Jun-92,ALDEA_CHALECO,KATHLEEN94@YAHOO.COM +926,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,11-Nov-20,SUMMER_IRWIN,F,13-Dec-19,16_DE_JULIO,LEESUSAN@HOTMAIL.COM +927,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,11-Nov-20,JESSICA_RODRIGUEZ,F,17-May-30,COSTA_DEL_ESTE,MNELSON@HOTMAIL.COM +928,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,11-Nov-20,ROBERT_PATEL,M,22-Jan-84,CAMPO_MONTE_LA_VIRUELA,MICHAEL81@YAHOO.COM +929,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,11-Nov-20,MIKAYLA_STEVENS,F,01-May-40,CATARATAS_DEL_IGUAZU,FRANK35@HOTMAIL.COM +930,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,11-Nov-20,RYAN_GEORGE,M,25-Mar-25,BAHIA_LANGARA,JOSEPH71@HOTMAIL.COM +931,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,11-Nov-20,KRISTIN_ELLIS,F,01-Dec-96,ZONA_DELTA_SAN_FERNANDO,TRIOS@YAHOO.COM +932,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,11-Nov-20,SARA_CARR,F,25-Nov-66,ARANGUREN,CHRISSMITH@YAHOO.COM +933,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,11-Nov-20,SARAH_BYRD,F,03-Nov-15,ARTURO_VATTEONE,XAVIERDELACRUZ@HOTMAIL.COM +934,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,11-Nov-20,MICHAEL_TRAN,M,11-Nov-18,ESTACION_DE_ZOOTECNIA_B,FRANK85@YAHOO.COM +935,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,11-Nov-20,LORI_CONTRERAS,F,13-Sep-17,CUESTA_DEL_TERNERO,ETAYLOR@HOTMAIL.COM +936,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,12-Nov-20,MICHAEL_MADDOX,M,16-Sep-64,AYACUCHO,CHRISTOPHER67@GMAIL.COM +937,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,12-Nov-20,ELIZABETH_LIU,F,20-Apr-21,ALMACEN_CASTRO,PRESTONSCOTT@HOTMAIL.COM 
+938,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,12-Nov-20,ANTHONY_LOPEZ,M,21-Nov-93,PUNTA_LARA,MONROEBRENDA@YAHOO.COM +939,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,12-Nov-20,CHAD_GONZALES,M,16-Jun-41,ALVAREZ_DE_TOLEDO,ROBERT24@HOTMAIL.COM +940,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,12-Nov-20,AMY_MOLINA,F,27-Jul-75,VILLARS,CHRISTINE26@YAHOO.COM +941,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,12-Nov-20,JULIA_BROOKS,F,03-Mar-15,ALDO_BONZI,OLIVIASTEWART@GMAIL.COM +942,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,12-Nov-20,JOSHUA_CARTER,M,15-Aug-41,BARRO_NEGRO,GVILLANUEVA@HOTMAIL.COM +943,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,12-Nov-20,MATTHEW_DAVIS,M,18-Jun-50,10_DE_MAYO,WRIGHTKATHLEEN@HOTMAIL.COM +944,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,12-Nov-20,JORGE_PEREZ_IV,M,09-Jun-70,BANDERALO,JASMINERUSSELL@GMAIL.COM +945,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,12-Nov-20,SEAN_NEAL,M,31-Mar-59,BALDE_DE_LEYES,PHAMJONATHON@HOTMAIL.COM +946,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,12-Nov-20,ADAM_MAHONEY,M,09-May-91,AGUA_DE_DIONISIO,TWALSH@YAHOO.COM +947,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,12-Nov-20,HEATHER_CLARK,F,05-Aug-43,ACONQUIJA,GPAYNE@YAHOO.COM +948,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,12-Nov-20,RICHARD_DUARTE,M,19-May-74,CAÑADA_ROSQUIN,TPOLLARD@YAHOO.COM +949,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,12-Nov-20,MELISSA_HERNANDEZ,F,14-Dec-13,CHACRAS_VIEJAS,LEWISRANDY@GMAIL.COM +950,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,12-Nov-20,NICOLE_CHANEY,F,15-May-48,COLONIA_AVELLANEDA,EVAUGHN@HOTMAIL.COM +951,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,12-Nov-20,PAM_TORRES,F,23-Dec-14,LA_COLINA,DAVIDWALL@HOTMAIL.COM +952,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,12-Nov-20,VANESSA_LEON,F,24-Oct-32,BAHIA_CREEK,CBENTON@GMAIL.COM +953,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,12-Nov-20,JOSEPH_THOMAS,M,23-Sep-60,BLANDENGUES,ERICWATERS@HOTMAIL.COM 
+954,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,13-Nov-20,PAMELA_DAVIS,F,20-Nov-77,ANTA,ALLENMICHAEL@GMAIL.COM +955,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,13-Nov-20,MICHELE_RIVERA,F,18-Oct-09,CAÑADA_DE_LAS_VACAS,HELEN20@HOTMAIL.COM +956,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,13-Nov-20,JENNIFER_WILSON,F,09-Jul-57,ALTO_PENCOSO,SMITHMICHELLE@YAHOO.COM +957,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,13-Nov-20,KELLY_DAVIS,F,18-Aug-25,AGUA_GRANDE,JOSEPH37@HOTMAIL.COM +958,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,13-Nov-20,MATTHEW_TERRELL,M,17-Mar-91,RINCON_DE_MILBERG,ZIMMERMANAMANDA@GMAIL.COM +959,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,13-Nov-20,ERIC_SIMON,M,27-Aug-34,BARRIO_LA_LUISA,MICHAELADAMS@HOTMAIL.COM +960,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,13-Nov-20,JASON_HOWARD,M,04-Oct-09,GOUIN,BHULL@HOTMAIL.COM +961,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,13-Nov-20,DENISE_FLOYD,F,27-Aug-28,ANDERSON,ERIC14@YAHOO.COM +962,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,13-Nov-20,KENDRA_HILL,F,25-Jan-00,CAPDEPONT,CALEBSIMS@HOTMAIL.COM +963,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,13-Nov-20,EMILY_LEONARD,F,07-Jul-31,LOS_POLVORINES,EVANSROBIN@GMAIL.COM +964,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,13-Nov-20,MARY_PORTER,F,28-Jul-78,BASE_AERONAVAL_PUNTA_INDIO,RASMUSSENMARK@HOTMAIL.COM +965,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,13-Nov-20,MICHAEL_WEBSTER,M,17-Apr-56,CABI_MONDA,DAVILAJEFFREY@YAHOO.COM +966,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,13-Nov-20,ANA_WEBB,F,04-Apr-08,ABRA,WILLIAMSERIC@YAHOO.COM +967,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,13-Nov-20,JOSEPH_CLARK,M,24-Jan-86,EMPALME_VILLA_CONSTITUCION,LWILLIAMS@GMAIL.COM +968,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,14-Nov-20,TIMOTHY_DICKERSON,M,27-Mar-12,CAMPO_RODRIGUEZ,CHRISTOPHERMYERS@HOTMAIL.COM 
+969,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,14-Nov-20,JOHN_LEE,M,04-Aug-08,CLAUDIO_C_MOLINA,JOHN66@GMAIL.COM +970,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,14-Nov-20,DYLAN_WILLIAMS,M,01-Jan-80,BERNAL_ESTE,SANDERSRANDY@GMAIL.COM +971,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,14-Nov-20,KIMBERLY_COLLINS,F,05-May-59,AGUA_DE_DIONISIO,RTHOMAS@YAHOO.COM +972,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,14-Nov-20,GREGORY_STAFFORD,M,17-May-70,COLONIA_RIVAS,JOHN40@YAHOO.COM +973,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,14-Nov-20,EMILY_REYNOLDS,F,30-Aug-24,COLONIA_FLORENCIA,UGIBSON@HOTMAIL.COM +974,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,14-Nov-20,KRYSTAL_GIBSON,F,07-Apr-76,ARROYO_BARU,FDIAZ@HOTMAIL.COM +975,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,14-Nov-20,NICOLE_SANDERS,F,07-Oct-32,ZONA_DELTA_SAN_FERNANDO,YCLARK@HOTMAIL.COM +976,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,14-Nov-20,SANDRA_SNYDER,F,04-Feb-97,ALMA_GRANDE,FLORESMEGHAN@YAHOO.COM +977,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,14-Nov-20,CRYSTAL_JOHNSON,F,09-Jul-05,LA_PRIMAVERA,HROSE@GMAIL.COM +978,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,14-Nov-20,JONATHAN_CONNER,M,14-Jan-44,ESTRADA,LOGANPORTER@YAHOO.COM +979,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,14-Nov-20,SHELBY_BLACKWELL,F,18-Jul-92,COLONIA_CAZAUX,CHRISTINA23@HOTMAIL.COM +980,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,14-Nov-20,CHRISTINE_MUNOZ_DDS,F,06-Mar-85,BARRANCAS_COLORADAS,JACOB22@HOTMAIL.COM +981,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,14-Nov-20,ZACHARY_MILLER,M,27-Jul-00,CALFUCURA,LISANIXON@GMAIL.COM +982,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,14-Nov-20,TYLER_WILSON,M,01-Aug-36,ANGOSTURA,GLENNCRUZ@GMAIL.COM +983,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,14-Nov-20,LUIS_MCDANIEL,M,18-Mar-40,PILAR,TOWNSENDANA@GMAIL.COM 
+984,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,15-Nov-20,SARA_AYALA,F,17-Mar-07,CASBAS,LANDERSON@HOTMAIL.COM +985,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,15-Nov-20,ERIKA_BARR,F,18-Mar-93,COMANDANTE_GIRIBONE,JUSTINWALTER@HOTMAIL.COM +986,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,15-Nov-20,JORDAN_HANSEN,F,03-Sep-30,PILAR,CAROLYNDUKE@HOTMAIL.COM +987,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,15-Nov-20,KIMBERLY_OWENS,F,09-May-40,GANDOLFI,IWOODWARD@YAHOO.COM +988,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,15-Nov-20,KELLY_COBB,F,29-Nov-42,AGUA_BLANCA,DAWSONDARREN@GMAIL.COM +989,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,15-Nov-20,BRIAN_SCHMIDT,M,10-Dec-23,COLONIA_ESCRIBANO,LCASTRO@GMAIL.COM +990,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,15-Nov-20,NICOLE_ATKINS,F,16-Apr-18,ARROYO_CASCO,BRADADAMS@GMAIL.COM +991,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,15-Nov-20,BRIAN_MOORE,M,10-Jan-35,SAN_BERNARDO_DEL_TUYU,ROBERTDICKSON@GMAIL.COM +992,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,15-Nov-20,JENNIFER_RODRIGUEZ,F,16-Aug-09,EZPELETA_ESTE,LEWISERIK@GMAIL.COM +993,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,16-Nov-20,CHRISTOPHER_BARNETT,M,22-Apr-92,ALDEA_SAN_ANDRES,KEITH11@GMAIL.COM +994,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,16-Nov-20,MATTHEW_HODGE_DDS,M,14-Aug-43,EL_ARBOLITO,RODRIGUEZJENNIFER@YAHOO.COM +995,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,16-Nov-20,TAMMY_CLARK,F,22-Oct-43,ANDALUCIA,BRENDAHUNT@YAHOO.COM +996,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,16-Nov-20,WANDA_JONES,F,12-Sep-47,ROLDAN,THOMASPORTER@YAHOO.COM +997,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,16-Nov-20,NICOLE_HALE,F,25-Mar-13,CHAPI_TALO,KATHY93@HOTMAIL.COM +998,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,16-Nov-20,ERICA_WHEELER,F,28-Mar-98,CANNING,JASONSANCHEZ@HOTMAIL.COM 
+999,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,16-Nov-20,ANTHONY_BLAIR,M,27-Apr-19,CAÑADON_FERRAIS,JEANETTEJOHNSON@GMAIL.COM +1000,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,16-Nov-20,MICHAEL_WEBB,M,29-Mar-24,LA_LIMPIA,BRITTNEY20@YAHOO.COM +1001,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,16-Nov-20,BRENDAN_STARK,M,10-Dec-04,PIAMONTE,HOPKINSGERALD@GMAIL.COM +1002,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,16-Nov-20,MICHELE_WILEY,F,20-Aug-14,COLONIA_PUJOL,ZMONTOYA@HOTMAIL.COM +1003,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,16-Nov-20,JOHN_CARROLL,M,07-Jun-39,AVANZADA,THORNTONROBERT@YAHOO.COM +1004,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,16-Nov-20,BRYAN_MURRAY,M,20-Nov-57,ARMSTRONG,JESSICA40@GMAIL.COM +1005,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,16-Nov-20,JAMIE_MILLER,F,03-Jan-55,CORONEL_PRINGLES,XHALL@YAHOO.COM +1006,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,17-Nov-20,JAMIE_HARVEY,F,22-Oct-84,BARRIALITOS,LAUREN93@GMAIL.COM +1007,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,17-Nov-20,BRITTNEY_HAMILTON,F,08-Feb-91,EDUARDO_COSTA,ERICA82@GMAIL.COM +1008,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,17-Nov-20,MONICA_CAMPBELL,F,31-Dec-11,CAMPO_GIMENEZ,IMORRIS@GMAIL.COM +1009,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,17-Nov-20,CARRIE_MORRIS,F,22-May-21,SANCTI_SPIRITU,SAMUELMILLER@YAHOO.COM +1010,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,17-Nov-20,BRIANNA_BLACKWELL,F,04-May-25,ARTEAGA,JAMESBENNETT@HOTMAIL.COM +1011,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,17-Nov-20,JASON_FARLEY,M,08-Aug-17,AMALIA,UHAYES@YAHOO.COM +1012,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,17-Nov-20,JAMES_PHILLIPS,M,01-Jan-11,COLONIA_VALDEZ,WBRYAN@YAHOO.COM +1013,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,17-Nov-20,LAURA_MCGEE,F,31-Jan-08,VILLA_EL_CHOCON,WILKINSJOSHUA@YAHOO.COM 
+1014,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,17-Nov-20,LESLIE_BROWN,F,22-Jan-85,BAUER_Y_SIGEL,FLORESHEIDI@YAHOO.COM +1015,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,17-Nov-20,BREANNA_LEVY,F,21-May-20,ARROYO_CEIBAL,JASONCAMPBELL@GMAIL.COM +1016,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,17-Nov-20,MICHELLE_PORTER,F,31-Jul-13,CALVO,FOSTERBENJAMIN@YAHOO.COM +1017,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,17-Nov-20,BENJAMIN_VASQUEZ,M,16-Aug-70,17_DE_AGOSTO,ANNETTEKOCH@YAHOO.COM +1018,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,17-Nov-20,LINDA_LEONARD,F,22-Jun-14,ARAUCO,MARTINFRANCISCO@HOTMAIL.COM +1019,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,17-Nov-20,MARIAH_MARTINEZ,F,24-Jan-34,ALTO_GRANDE,KINGCHRISTY@HOTMAIL.COM +1020,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,17-Nov-20,JEFFREY_QUINN,M,07-Nov-05,BERUTI,EMARTINEZ@GMAIL.COM +1021,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,18-Nov-20,APRIL_ROSE,F,23-Jul-45,SIERRA_DE_LA_VENTANA,VANESSA38@YAHOO.COM +1022,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,18-Nov-20,STEPHEN_SCOTT,M,25-Sep-41,ALTO_DE_SIERRA,ALISON13@GMAIL.COM +1023,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,18-Nov-20,RYAN_ROJAS,M,28-Sep-20,CAMPO_HUBER,KELLYMCMILLAN@YAHOO.COM +1024,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,18-Nov-20,SUSAN_SMITH,F,23-Nov-27,ARTURO_SEGUI,SARAJOHNSON@HOTMAIL.COM +1025,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,18-Nov-20,FERNANDO_BOYD,M,04-Nov-38,DESPEÑADEROS,SOTOKEVIN@HOTMAIL.COM +1026,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,18-Nov-20,DANNY_CANNON,M,23-Nov-11,CINCO_SALTOS,KIMBERLYWYATT@YAHOO.COM +1027,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,18-Nov-20,BRIANNA_LUCAS,F,17-Jul-41,SANTOS_LUGARES,MIACASTILLO@GMAIL.COM +1028,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,18-Nov-20,MIKE_PATTON,M,03-Jan-65,ESTACION_YERUA,JARVISJENNIFER@GMAIL.COM +1029,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,18-Nov-20,LINDA_RIOS,F,02-Jul-54,ANECON_CHICO,KELLYPRICE@HOTMAIL.COM 
+1030,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,18-Nov-20,JUAN_MANN,M,16-Sep-87,GOBERNADOR_BENEGAS,AGUIRREJENNIFER@GMAIL.COM +1031,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,18-Nov-20,AMANDA_SMITH,F,03-Nov-29,BUEN_RETIRO,WILLIAMSALLISON@GMAIL.COM +1032,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,18-Nov-20,EVELYN_GONZALEZ,F,29-Aug-58,ESTRADA,CHRISTOPHER21@HOTMAIL.COM +1033,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,19-Nov-20,MANUEL_THOMPSON,M,12-Jan-66,SANCTI_SPIRITU,DHAWKINS@GMAIL.COM +1034,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,19-Nov-20,FRANK_VILLA,M,21-Apr-21,GENERAL_SAN_MARTIN,QHAMILTON@YAHOO.COM +1035,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,19-Nov-20,HEATHER_PARKER,F,18-Dec-93,LA_BANDA,WARNERERIN@HOTMAIL.COM +1036,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,19-Nov-20,ELIZABETH_SPARKS,F,22-Jul-58,MEMBRILLAR,CLIN@HOTMAIL.COM +1037,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,19-Nov-20,DANIEL_LOPEZ,M,12-Jan-62,BLAS_DURAÑONA,OBRIENDAVID@GMAIL.COM +1038,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,19-Nov-20,MRS._JORDAN_GONZALEZ,F,25-Oct-68,CAÑADA,KJACKSON@GMAIL.COM +1039,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,20-Nov-20,DAVID_RANDOLPH,M,27-Nov-10,CASTILLA,LEAHEDWARDS@YAHOO.COM +1040,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,20-Nov-20,ANTONIO_LEE,M,21-Aug-85,COLONIA_BARON_HIRSCH,SGUTIERREZ@HOTMAIL.COM +1041,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,20-Nov-20,AUDREY_FLOWERS,F,07-Oct-55,EL_ALTO,STEVEN90@YAHOO.COM +1042,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,20-Nov-20,SUSAN_SIMMONS,F,02-Feb-09,ALDAO,SARAH17@GMAIL.COM +1043,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,20-Nov-20,AUSTIN_GREEN,M,25-Aug-36,LIBERTAD,RHARDIN@HOTMAIL.COM +1044,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,20-Nov-20,CHAD_KELLEY,M,22-Sep-91,SAN_JOSE,GHARRIS@HOTMAIL.COM 
+1045,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,20-Nov-20,AMANDA_LAWSON_DDS,F,30-Jul-07,DESVIO_KILOMETRO_234,SAMANTHAOWEN@YAHOO.COM +1046,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,20-Nov-20,DERRICK_MOORE,M,22-May-41,EL_ALTO,OMAR43@YAHOO.COM +1047,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,20-Nov-20,CINDY_TORRES,F,30-Aug-17,CHICHAGASTA,BENSONJAMES@GMAIL.COM +1048,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,20-Nov-20,LEAH_ANDREWS,F,30-Oct-13,DIAMANTE,LOVENATASHA@GMAIL.COM +1049,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,20-Nov-20,REGINA_BAUER,F,20-Mar-85,CALCHAQUI,HWELLS@YAHOO.COM +1050,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,20-Nov-20,JODY_WILLIAMS,F,05-Jul-02,BAÑADO_SAN_ANTONIO,FOWLERWILLIAM@HOTMAIL.COM +1051,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,21-Nov-20,STEVEN_REEVES,M,19-Jul-21,BARRA_BONITA,KNAPPJENNIFER@GMAIL.COM +1052,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,21-Nov-20,SHANNON_BECKER,F,18-Jan-89,ALFREDO_DEMARCHI,UTHOMAS@YAHOO.COM +1053,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,21-Nov-20,RICHARD_MILLER,M,17-Nov-28,ALAMO,JUSTIN89@HOTMAIL.COM +1054,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,21-Nov-20,RAYMOND_ANDREWS,M,11-Apr-94,VILLA_SABOYA,PAULHAMILTON@GMAIL.COM +1055,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,21-Nov-20,CAROL_BLAKE,F,25-Nov-57,ALPATACAL,DANIELBURCH@GMAIL.COM +1056,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,21-Nov-20,ANTHONY_BAIRD,M,08-Sep-70,JOSE_CLEMENTE_PAZ,HERNANDEZANDREW@HOTMAIL.COM +1057,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,21-Nov-20,BRADLEY_ANDERSON,M,28-Jul-14,FAVELLI,COCHRANBRITTANY@GMAIL.COM +1058,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,22-Nov-20,MARC_BURTON,M,30-Jun-98,GORCHS,JORDANROBERT@YAHOO.COM +1059,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,22-Nov-20,COURTNEY_RAMIREZ,F,01-Feb-10,EL_CHALTEN,SARAH63@YAHOO.COM 
+1060,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,22-Nov-20,JAMES_PORTER,M,06-Mar-10,EL_PINO,HWARD@YAHOO.COM +1061,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,22-Nov-20,STACEY_RUSSELL,F,25-Aug-51,COSTA_DEL_RIO_AZUL,JENNIFER99@YAHOO.COM +1062,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,22-Nov-20,MR._KENNETH_SMITH_MD,M,11-Dec-20,BATERIAS,DANIELLELEE@YAHOO.COM +1063,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,22-Nov-20,LARRY_HERRERA,M,02-Feb-96,ARROYO_CEIBAL,DANIELSJEAN@YAHOO.COM +1064,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,22-Nov-20,AMY_RHODES,F,06-Feb-33,ERNESTINA,TRACEYSHARP@HOTMAIL.COM +1065,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,22-Nov-20,DANIEL_SHORT,M,03-Mar-71,EL_GUANACO,CINDYHALL@YAHOO.COM +1066,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,22-Nov-20,KAITLIN_WADE,F,13-Jan-05,DOCTOR_DOMINGO_HAROSTEGUY,LUISCARTER@YAHOO.COM +1067,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,22-Nov-20,LAUREN_GONZALEZ,F,23-Nov-42,DUDIGNAC,WILLIAMSSAMUEL@YAHOO.COM +1068,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,22-Nov-20,ANA_PHILLIPS,F,17-Oct-31,CORONEL_ISLEÑOS,LINDA96@HOTMAIL.COM +1069,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,22-Nov-20,SCOTT_MCCARTHY_PHD,M,28-Oct-32,ALGARROBO,JON76@YAHOO.COM +1070,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,22-Nov-20,MARCUS_MURPHY,M,06-Nov-53,COLMAN,TYLERALLISON@YAHOO.COM +1071,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,22-Nov-20,MOLLY_CURTIS,F,28-Jun-17,ARAÑITA,ANNA26@YAHOO.COM +1072,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,22-Nov-20,AMBER_GRAHAM,F,05-Mar-31,AGUSTONI,KRISTINACOMPTON@YAHOO.COM +1073,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,22-Nov-20,TRACY_GIBBS,F,18-May-81,FLORENCIO_VARELA,THOMASTAMMY@GMAIL.COM +1074,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,22-Nov-20,LAURIE_BROWN,F,24-Jun-59,SAN_ISIDRO,MICHAEL35@HOTMAIL.COM 
+1075,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,22-Nov-20,TINA_BERG,F,04-Jun-53,ZONA_DELTA_TIGRE,BOWERSNATALIE@YAHOO.COM +1076,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,23-Nov-20,MARY_BAILEY,F,30-Dec-85,AMERICA_UNIDA,REGINACHURCH@GMAIL.COM +1077,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,23-Nov-20,MARY_TOWNSEND,F,03-May-64,CHIMPAY,THOFFMAN@GMAIL.COM +1078,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,23-Nov-20,LISA_ROGERS,F,16-Sep-23,JUANCHO,WRIGHTMICHAEL@YAHOO.COM +1079,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,23-Nov-20,BRIAN_CRUZ,M,27-Oct-33,CAMPO_DE_LOS_ANDES,SJOHNSON@GMAIL.COM +1080,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,23-Nov-20,MRS._LAURA_SMITH,F,15-Oct-67,BARRANQUERAS,ROBERT73@YAHOO.COM +1081,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,23-Nov-20,PATRICIA_MARTIN,F,23-Jun-10,ASCENCION,THODGES@GMAIL.COM +1082,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,23-Nov-20,JOSHUA_BELL,M,09-Nov-71,COLONIA_DEVOTO,ANDRESTATE@YAHOO.COM +1083,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,24-Nov-20,LESLIE_MACDONALD,F,30-Nov-11,CENTRO_AGRICOLA_EL_PATO,LEWISKRISTEN@HOTMAIL.COM +1084,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,24-Nov-20,BRADLEY_HERNANDEZ,M,17-Feb-38,16_DE_JULIO,SANDRAWEBSTER@HOTMAIL.COM +1085,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,24-Nov-20,MARK_JOHNSON,M,01-May-07,AGUA_COLORADA,BROWNTRAVIS@HOTMAIL.COM +1086,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,24-Nov-20,JOANNA_KEY,F,05-Oct-50,LAS_TONINAS,ELIZABETH94@GMAIL.COM +1087,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,24-Nov-20,PATRICIA_MUNOZ,F,13-Mar-97,CAFFERATA,AMILLER@YAHOO.COM +1088,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,24-Nov-20,LAURIE_SCHMITT,F,21-Jul-08,SANCTI_SPIRITU,TRAVISWALKER@GMAIL.COM 
+1089,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,24-Nov-20,DUSTIN_WRIGHT,M,01-Nov-21,CAMPO_BOTTO,ZMORENO@HOTMAIL.COM +1090,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,24-Nov-20,JENNIFER_OLSEN,F,20-Jul-78,ARSENAL_DE_GUERRA_SAN_LORENZO,SHELTONCRYSTAL@YAHOO.COM +1091,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,24-Nov-20,BARBARA_PEREZ,F,15-Mar-38,ARRAYANAL,CLARKMICHAEL@GMAIL.COM +1092,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,24-Nov-20,JACOB_SPARKS_MD,M,18-Jan-89,COLONIA_EGIDO,CASSIE03@YAHOO.COM +1093,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,25-Nov-20,JOHN_ENGLISH,M,26-Jul-20,ALGARROBAL_PUISOYE,ERINGARCIA@HOTMAIL.COM +1094,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,25-Nov-20,BRIAN_CLARK,M,11-Sep-28,CARCARAÑA,FERNANDO28@HOTMAIL.COM +1095,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,25-Nov-20,JESSICA_STEWART,F,11-Dec-10,ABRA_MAYO,BRENDA74@YAHOO.COM +1096,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,25-Nov-20,ALYSSA_GEORGE,F,06-Dec-49,BOCAS,STACEY81@GMAIL.COM +1097,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,25-Nov-20,KELLY_HENRY,F,23-Sep-12,GRUTLY,MILLERJARED@YAHOO.COM +1098,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,25-Nov-20,DAVID_MCCOY,M,16-Feb-10,COLONIA_ZAPATA,ALLENRONNIE@GMAIL.COM +1099,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,25-Nov-20,TIMOTHY_AGUIRRE,M,21-Jun-42,VILLA_OLIVARI,DYOUNG@YAHOO.COM +1100,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,25-Nov-20,KIRK_ROBINSON,M,26-Sep-60,ALTO_PENCOSO,XTHOMPSON@YAHOO.COM +1101,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,25-Nov-20,KYLE_GROSS,M,12-Apr-81,ARROYO_GRANDE,RANDYLONG@YAHOO.COM +1102,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,25-Nov-20,MARY_LEE,F,12-Dec-18,BALSA_SENILLOSA,ADAMHILL@HOTMAIL.COM 
+1103,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,25-Nov-20,NICOLE_HOPKINS,F,09-Jun-02,ACHERAL,CHRISTOPHER41@GMAIL.COM +1104,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,25-Nov-20,RACHEL_JOHNSON,F,01-Jun-53,COLONIA_BELLA_ITALIA,UWILSON@HOTMAIL.COM +1105,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,25-Nov-20,DALE_LONG,M,06-Jun-80,20_DE_JUNIO,MATTHEW93@GMAIL.COM +1106,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,25-Nov-20,MICHELLE_HOLMES,F,31-May-72,PRIMERA_JUNTA,GONZALEZVANESSA@YAHOO.COM +1107,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,25-Nov-20,KRISTINE_SULLIVAN,F,30-May-21,BERAZATEGUI,FLOWERSJAMES@YAHOO.COM +1108,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,25-Nov-20,MATTHEW_GUTIERREZ,M,28-Jul-08,CANDELARIA,TIFFANYDAVIS@YAHOO.COM +1109,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,25-Nov-20,CARLOS_SMITH,M,18-Jul-49,ALIJILAN,MATTHEW57@YAHOO.COM +1110,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,26-Nov-20,JOHN_JENKINS,M,14-Aug-70,25_DE_MAYO,REYNOLDSKENNETH@GMAIL.COM +1111,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,26-Nov-20,PAMELA_MAYO,F,24-Mar-71,AGUA_SALADA,JULIEJONES@HOTMAIL.COM +1112,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,26-Nov-20,TIMOTHY_WILSON,M,28-Jun-16,BAÑOS_DE_LA_LAJA,ANTHONY97@GMAIL.COM +1113,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Nov-20,JORDAN_GRIFFIN,M,24-Oct-07,BALSA,KRISTINBALDWIN@YAHOO.COM +1114,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,26-Nov-20,LINDSAY_OBRIEN,F,08-Oct-88,AGUA_COLORADA,IFARRELL@GMAIL.COM +1115,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,26-Nov-20,CHRISTIE_THOMAS,F,19-May-90,BERRETTA,DBROOKS@YAHOO.COM +1116,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,26-Nov-20,RICHARD_STEVENS,M,04-Jul-76,COLONIA_ZAPATA,TERRY03@HOTMAIL.COM 
+1117,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Nov-20,TIFFANY_JONES,F,27-Aug-85,JOSE_FERRARI,NOLSON@YAHOO.COM +1118,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,27-Nov-20,TIMOTHY_ANDERSON,M,04-Dec-06,ARISTIDES_VILLANUEVA,KINGWENDY@HOTMAIL.COM +1119,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,27-Nov-20,SHARON_RANDOLPH,F,27-Jan-49,EL_RETIRO,MCKINNEYKIMBERLY@YAHOO.COM +1120,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,27-Nov-20,JESSICA_FORD,F,05-Jul-24,BAÑADITO_VIEJO,JAMESPALMER@GMAIL.COM +1121,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,27-Nov-20,ZACHARY_FISHER,M,06-Feb-62,ADELA,KPRICE@YAHOO.COM +1122,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,27-Nov-20,SUE_HUGHES,F,08-Jan-21,AGUA_AMARILLA_LA_HOYADA,SANDRAJIMENEZ@GMAIL.COM +1123,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,27-Nov-20,THERESA_JOHNSON,F,07-Feb-68,AGUA_DE_DIAZ,HARVEYKELSEY@GMAIL.COM +1124,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,27-Nov-20,CRAIG_YOUNG,M,11-Apr-10,CENTINELA,DANIEL34@GMAIL.COM +1125,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,27-Nov-20,ROBERT_MCCLURE,M,22-Oct-24,ARROYO_CAHUNCO,MATTHEWBECK@HOTMAIL.COM +1126,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,27-Nov-20,DEBBIE_CRAIG,F,01-Oct-57,COLONIA_MORGAN,DHARVEY@GMAIL.COM +1127,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,27-Nov-20,COURTNEY_JONES,F,18-Dec-55,ARTURO_VATTEONE,MICHELLEFORD@YAHOO.COM +1128,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,27-Nov-20,MARY_RODRIGUEZ,F,14-Feb-71,COLONIA_ABATE,KELLY27@YAHOO.COM +1129,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,27-Nov-20,SANDY_REYES,F,04-May-10,ARMINDA,EMILYBOYLE@YAHOO.COM +1130,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,28-Nov-20,AMANDA_COX,F,13-Apr-26,ESTANCIA_SANTA_CATALINA,VCAMPBELL@GMAIL.COM +1131,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,28-Nov-20,AMBER_LOPEZ,F,19-May-17,COLIQUEO,CAMPBELLALLEN@HOTMAIL.COM 
+1132,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,28-Nov-20,TARA_TRAN,F,13-Jul-16,BARRANQUITAS,PATELMACKENZIE@YAHOO.COM +1133,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,28-Nov-20,EDWARD_WHEELER,M,02-Nov-63,BONNEMENT,BURNETTBRIAN@YAHOO.COM +1134,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,28-Nov-20,HOWARD_COHEN,M,02-Mar-67,CERRO_ACONCAGUA,MICHAELNICHOLS@YAHOO.COM +1135,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,28-Nov-20,COLLEEN_SMITH,F,19-Nov-36,SANTA_TERESITA,NHARVEY@GMAIL.COM +1136,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,28-Nov-20,DAVID_FLORES,M,20-Apr-33,ALTAMIRANO_NORTE,FLOWERSKAITLYN@GMAIL.COM +1137,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,28-Nov-20,GARY_DAVIES,M,20-Jun-62,LOS_CORREDORES,PBRADY@GMAIL.COM +1138,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,28-Nov-20,RENEE_WILLIAMS,F,01-Dec-48,SAN_GERONIMO,VICTORIA69@GMAIL.COM +1139,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,28-Nov-20,ELIZABETH_TAYLOR,F,04-Nov-55,ALTAMIRA,MCCULLOUGHMARY@YAHOO.COM +1140,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,28-Nov-20,HEATHER_FISHER,F,19-Nov-76,ARROYO_CHALIA,ERIN73@GMAIL.COM +1141,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,28-Nov-20,TIMOTHY_MEDINA,M,18-Oct-11,ANTONIO_TOMAS,ERIN20@YAHOO.COM +1142,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,28-Nov-20,SUSAN_YOUNG,F,25-Mar-09,CAMPO_QUIÑONES,AMY45@YAHOO.COM +1143,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,28-Nov-20,MICHELE_ALVAREZ,F,03-Nov-10,AGUA_COLORADA,CHRISTINE92@YAHOO.COM +1144,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,29-Nov-20,GREGORY_BENITEZ,M,21-Jul-78,DE_BRUYN,COLLINSJENNIFER@HOTMAIL.COM +1145,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,29-Nov-20,THERESA_HUDSON,F,05-Oct-45,VALLE_DE_LAS_LEÑAS,BONILLAMICHAEL@GMAIL.COM 
+1146,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,29-Nov-20,YVONNE_MCINTOSH,F,15-May-41,BATAVIA,KIMBERLYSCOTT@HOTMAIL.COM +1147,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,29-Nov-20,JOSHUA_HARRIS,M,16-Apr-75,ARBOL_SOLO,OLIVIARIVERA@HOTMAIL.COM +1148,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,29-Nov-20,SARAH_AGUIRRE,F,02-Dec-01,CRISTIANO_MUERTO,PAUL08@GMAIL.COM +1149,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,29-Nov-20,KATHERINE_RODRIGUEZ,F,18-Dec-90,ARTURO_SEGUI,DEBORAH45@YAHOO.COM +1150,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,29-Nov-20,DAVID_BAKER,M,30-Apr-17,ALBERTI,CHRISTIANSMITH@GMAIL.COM +1151,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,29-Nov-20,AMBER_MANN,F,13-Mar-18,LA_LUCILA,SUSAN22@HOTMAIL.COM +1152,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,29-Nov-20,CHRISTOPHER_OWENS,M,04-May-28,16_DE_JULIO,STEPHANIE42@YAHOO.COM +1153,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,29-Nov-20,KELLY_MONTOYA,F,14-Jul-10,ACEBAL,DARRENHAMPTON@YAHOO.COM +1154,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,30-Nov-20,JULIA_CHAPMAN,F,18-Oct-69,CHAPUY,JULIEWARREN@YAHOO.COM +1155,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,30-Nov-20,NICHOLAS_KING,M,03-Mar-17,BARRIO_CHAPADMALAL,TINAMEYER@YAHOO.COM +1156,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,30-Nov-20,JULIE_MACIAS,F,30-Jun-47,SAN_JOSE_DE_PIEDRA_BLANCA,HABBOTT@GMAIL.COM +1157,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,30-Nov-20,CHRISTOPHER_CHAMBERS,M,24-Jun-85,30_DE_AGOSTO,MATTHEWVASQUEZ@YAHOO.COM +1158,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,30-Nov-20,MAUREEN_MCCALL,F,01-May-34,CAPITAN_CASTRO,STEPHEN46@HOTMAIL.COM +1159,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,30-Nov-20,BRADLEY_WRIGHT,M,10-Jul-00,BARRIO_FERRI,PAULA34@GMAIL.COM 
+1160,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,30-Nov-20,CASSIE_BLACKWELL,F,04-Jan-48,BARRIO_PARQUE_LELOIR,ANGELARAMOS@YAHOO.COM +1161,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,30-Nov-20,BETHANY_HENDERSON,F,18-Jun-16,EL_CHUMBEAU,HENDERSONADRIENNE@HOTMAIL.COM +1162,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,30-Nov-20,EMILY_FOLEY,F,26-Sep-10,ANASAGASTI,ANDREATHOMAS@YAHOO.COM +1163,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,30-Nov-20,PATRICK_PEARSON,M,12-Oct-76,JUAN_F_IBARRA,CPHILLIPS@GMAIL.COM +1164,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,30-Nov-20,DEVIN_MCCOY,M,20-Feb-81,SAN_ISIDRO,DARRENRYAN@HOTMAIL.COM +1165,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,30-Nov-20,RHONDA_CALLAHAN,F,05-Feb-66,GENERAL_CONESA,IBROWN@YAHOO.COM +1166,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,30-Nov-20,JAMES_ROGERS,M,18-Jul-65,AGUA_BOTADA,JAMES06@HOTMAIL.COM +1167,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,30-Nov-20,DAVID_BARBER,M,07-Jun-09,EL_ARBOLITO,TAMMY18@YAHOO.COM +1168,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,30-Nov-20,DARRELL_GRIFFIN,M,26-Apr-35,VILLA_LERGA,BRADLEY12@GMAIL.COM +1169,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,01-Dec-20,STACEY_WATTS,F,13-Jul-33,DINA_HUAPI,REGINALDDAVIS@GMAIL.COM +1170,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,01-Dec-20,ZACHARY_MCDONALD,M,29-Jun-06,AGUA_AZUL,BOWENALISON@HOTMAIL.COM +1171,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,01-Dec-20,CHRISTOPHER_ROBERTS,M,27-Jun-59,2_DE_JULIO,PERRYMATTHEW@YAHOO.COM +1172,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Dec-20,DENNIS_FORD,M,19-Sep-35,AMAMBAY,ANNETTE41@HOTMAIL.COM +1173,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,01-Dec-20,BRIAN_ALEXANDER,M,06-Nov-03,CAÑADON_FERRAIS,AVILAYVETTE@YAHOO.COM +1174,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Dec-20,RACHEL_KRUEGER,F,22-Sep-84,CAÑADON_LAGARTO,CHAVEZJOHN@YAHOO.COM 
+1175,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,01-Dec-20,JENNA_HUBER,F,09-Jan-07,ALBARDON,DADAMS@GMAIL.COM +1176,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,01-Dec-20,COURTNEY_GRANT,F,01-Aug-76,ARBOL_SOLO,MICHAEL11@GMAIL.COM +1177,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Dec-20,BRANDON_JONES,M,03-Jun-14,ARROYO_PESCADO,DENISE90@GMAIL.COM +1178,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,01-Dec-20,SANDRA_PEREZ,F,20-May-58,JUAN_VELA,UJACOBS@HOTMAIL.COM +1179,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,02-Dec-20,KARL_REED,M,07-Feb-88,CAMPO_EL_MATACO,NWATKINS@YAHOO.COM +1180,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,02-Dec-20,TERESA_VELASQUEZ,F,06-Feb-26,ALGARROBO,MICHAELNELSON@GMAIL.COM +1181,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,02-Dec-20,PATRICK_WILLIAMS,M,17-Apr-62,CENTRO_AGRICOLA_EL_PATO,JOHNSONDONNA@GMAIL.COM +1182,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,02-Dec-20,TAYLOR_KRAMER,M,19-Oct-16,CULLIN_MANZANO,COURTNEY43@HOTMAIL.COM +1183,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,02-Dec-20,LINDA_CHRISTIAN,F,03-Dec-05,AGUADA_DE_PIEDRA,JAMES55@GMAIL.COM +1184,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,02-Dec-20,NATALIE_SMITH,F,06-Mar-87,VILLA_LERGA,FRANKLIN28@YAHOO.COM +1185,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,02-Dec-20,MATTHEW_ROMERO,M,10-Feb-03,AGUAS_VERDES,JOSEPH54@GMAIL.COM +1186,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,02-Dec-20,BRIANNA_HOUSTON,F,08-Mar-53,CAÑADON_CALIENTE,CRYSTAL13@YAHOO.COM +1187,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,02-Dec-20,BENJAMIN_MILLER,M,25-Apr-54,ALDEA_FORESTAL,COOPERADRIANA@GMAIL.COM +1188,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,02-Dec-20,JAMES_BURNS,M,10-Aug-83,DON_TORCUATO,JKING@HOTMAIL.COM +1189,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,02-Dec-20,RUSSELL_MARTIN,M,12-Feb-13,ARROYO_CORTO,TYLER82@GMAIL.COM 
+1190,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,02-Dec-20,HEATHER_WALKER,F,05-Apr-09,EL_DIQUE,CHARLES32@YAHOO.COM +1191,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,02-Dec-20,ERIN_BEARD,F,08-Jun-31,COLONIA_JAUREGUI,KAYLACOLE@GMAIL.COM +1192,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,02-Dec-20,SHANNON_ANDERSON,F,28-Jun-18,ATALIVA_ROCA,TCRUZ@YAHOO.COM +1193,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,02-Dec-20,MADISON_SMALL,F,11-Apr-69,IGARZABAL,BOWENBRETT@YAHOO.COM +1194,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,03-Dec-20,AMY_ARNOLD,F,10-Jan-03,ALPACHIRI,QUINNALISHA@GMAIL.COM +1195,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,03-Dec-20,MARY_MERCADO,F,11-Apr-84,10_DE_MAYO,COPELANDAMY@GMAIL.COM +1196,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,03-Dec-20,KATHY_FOWLER,F,04-Jul-17,VALLE_DE_LAS_LEÑAS,DKING@HOTMAIL.COM +1197,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,03-Dec-20,BRETT_FLORES,M,12-Jul-56,CACHEL,REBECCAPEREZ@YAHOO.COM +1198,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,03-Dec-20,MARY_DAVIS,F,15-Oct-54,ALTO_DE_SIERRA,WESTERIN@HOTMAIL.COM +1199,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,03-Dec-20,BRENDA_SHEPHERD,F,19-Apr-19,ASUNCION_MARIA,BRITTNEY50@HOTMAIL.COM +1200,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,03-Dec-20,COURTNEY_CASTRO,F,17-Mar-66,FLORENTINO_AMEGHINO,ANGELA75@YAHOO.COM +1201,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,03-Dec-20,JEFFREY_KELLEY,M,17-Aug-24,CAMPO_LARGO,XJOHNSON@GMAIL.COM +1202,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,03-Dec-20,ALLISON_ROACH,F,14-Aug-08,LA_MOROCHA,KRISTINA87@HOTMAIL.COM +1203,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,03-Dec-20,MR._STEPHEN_HERNANDEZ_DDS,M,05-Mar-18,DIAMANTE,BRIANNARODRIGUEZ@HOTMAIL.COM +1204,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,04-Dec-20,FRANK_PRUITT,M,08-Aug-77,LA_SARA,LEJOHN@YAHOO.COM 
+1205,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,04-Dec-20,MRS._JULIE_SMITH,F,10-Oct-53,BUENA_VISTA,KARENCRUZ@YAHOO.COM +1206,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,04-Dec-20,MIKAYLA_GRAY,F,02-May-91,AGUA_AZUL,LORI87@HOTMAIL.COM +1207,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,04-Dec-20,ROBERT_RICHARDSON_III,M,06-Aug-50,SAN_ISIDRO,JOELCOLE@GMAIL.COM +1208,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,04-Dec-20,JEREMY_SMITH,M,15-Aug-05,EL_HOYO,TODD40@YAHOO.COM +1209,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,04-Dec-20,AMANDA_STRONG,F,30-Mar-02,COMODORO_RIVADAVIA,JROJAS@HOTMAIL.COM +1210,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,04-Dec-20,PAULA_WALKER,F,11-Jun-50,ARROYO_CORTO,DALTONJUSTIN@GMAIL.COM +1211,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,04-Dec-20,DEBORAH_LEE,F,23-Oct-81,CORRAL_DE_PIEDRAS,CFISHER@YAHOO.COM +1212,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,04-Dec-20,BETH_DIXON,F,03-Mar-11,ALTO_GRANDE,WYATT89@HOTMAIL.COM +1213,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,04-Dec-20,EMILY_FOWLER,F,06-Jan-04,BALCARCE,XMAY@GMAIL.COM +1214,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,04-Dec-20,KELSEY_JOHNSON,F,16-Nov-95,CARAGUATAY,ETURNER@HOTMAIL.COM +1215,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,04-Dec-20,MICHELLE_CASTILLO,F,15-Oct-90,LOS_ANTIGUOS,CHRISTOPHERMORALES@YAHOO.COM +1216,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,04-Dec-20,JENNIFER_PETERSEN,F,08-Dec-50,CARAHUNCO,WDORSEY@HOTMAIL.COM +1217,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,04-Dec-20,JAMIE_COMPTON,F,20-Nov-85,EL_PIMPOLLO,KIMBERLY66@HOTMAIL.COM +1218,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,04-Dec-20,GARY_LANE,M,14-Feb-07,COLONIA_CALIFORNIA,FOSTERJEFFREY@HOTMAIL.COM +1219,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,05-Dec-20,JOHN_SMITH,M,30-Mar-37,ALPACHIRI,TIMOTHY61@GMAIL.COM 
+1220,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,05-Dec-20,ROBERT_NAVARRO,M,18-Jun-62,ARROYO_CEIBAL,CHUNGSTEPHEN@YAHOO.COM +1221,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,05-Dec-20,BONNIE_STEVENS,F,16-Nov-43,ADOLFO_ALSINA,COFFEYWILLIAM@HOTMAIL.COM +1222,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,05-Dec-20,DEREK_BAILEY,M,15-Jan-41,COLONIA_DOS_ROSAS_Y_LA_LEGUA,HALEYRODRIGUEZ@YAHOO.COM +1223,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,06-Dec-20,BLAKE_COOK,M,21-Mar-77,EL_PERDIDO_EST_JOSE_GUISASOLA,JACKSONAMY@YAHOO.COM +1224,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,06-Dec-20,BRITTANY_BRADSHAW,F,18-Mar-00,RICARDO_LAVALLE,HARRISSEAN@HOTMAIL.COM +1225,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,06-Dec-20,KAREN_STANLEY,F,02-Feb-09,AGUADA_DE_LA_PEÑA,HORNEJASON@YAHOO.COM +1226,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,06-Dec-20,JENNIFER_CLARK,F,16-Dec-16,BELLA_ITALIA,PRICESTEVEN@HOTMAIL.COM +1227,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,06-Dec-20,HALEY_ANDREWS,F,11-Sep-34,AGUA_DEL_SIMBOL,SEAN04@GMAIL.COM +1228,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,06-Dec-20,REBECCA_HOLMES,F,30-Dec-18,9_DE_JULIO,TYLERDECKER@HOTMAIL.COM +1229,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,06-Dec-20,BETH_NELSON,F,24-Aug-12,AMALIA,ASHLEY22@HOTMAIL.COM +1230,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,06-Dec-20,TERESA_HARDY,F,11-Jul-19,AGUA_SALADA,STEWARTSTACEY@YAHOO.COM +1231,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,06-Dec-20,SHERRI_GROSS,F,22-Nov-13,ARROYO_PALMAR,DELEONSARA@HOTMAIL.COM +1232,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,06-Dec-20,CHRISTINE_CURRY,F,16-May-18,MARIA_MAGDALENA,WILSONCHRISTOPHER@HOTMAIL.COM +1233,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,07-Dec-20,BRETT_VARGAS,M,29-Oct-24,GUAMINI,SAVILA@HOTMAIL.COM 
+1234,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,07-Dec-20,LESLIE_BRYAN,F,15-Jan-72,HUGHES,CHANGCHRISTINE@GMAIL.COM +1235,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,07-Dec-20,JULIE_NORMAN_DVM,F,19-Oct-57,AGUA_AMARGA,ELLIOTTDOUGLAS@YAHOO.COM +1236,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,07-Dec-20,SHANNON_ALLEN,F,12-Feb-22,BARRIO_CHAPADMALAL,LCHAVEZ@GMAIL.COM +1237,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,07-Dec-20,LISA_WHITE,F,25-Feb-16,VALENTIN_ALSINA,SHERRERA@HOTMAIL.COM +1238,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,07-Dec-20,JASON_RODRIGUEZ,M,14-Jan-97,ALDEA_BRASILERA,ASHLEYENGLISH@YAHOO.COM +1239,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,07-Dec-20,ERIC_GRIFFITH,M,04-Sep-41,ALEJANDRO_PETION,FROSTBETH@YAHOO.COM +1240,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,07-Dec-20,DENISE_GILBERT,F,31-Oct-89,VILLA_HIPODROMO,FREED@HOTMAIL.COM +1241,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,07-Dec-20,BRIAN_RAY,M,10-Mar-79,ABASTO,SEAN56@YAHOO.COM +1242,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,07-Dec-20,RICHARD_GRIFFITH,M,10-Jul-69,ABRA_DEL_TAFI,RAMSEYALEX@YAHOO.COM +1243,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,07-Dec-20,CHRISTOPHER_COOKE,M,24-Feb-02,CALERA_ARGENTINA,JAMIEBOYLE@YAHOO.COM +1244,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,07-Dec-20,TRACY_SCHAEFER,F,01-Dec-23,BANFIELD,XBROWN@HOTMAIL.COM +1245,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,07-Dec-20,ANGELA_MALONE,F,14-Mar-69,CHICLANA,RYANJIMENEZ@GMAIL.COM +1246,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,07-Dec-20,MRS._ROBYN_MCCARTY,F,18-Jan-12,ABRA_DEL_TRIGO,SHARON50@HOTMAIL.COM +1247,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,07-Dec-20,JUSTIN_DAVIS,M,28-Nov-85,CHIVILCOY,GOULDLAURA@YAHOO.COM +1248,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,07-Dec-20,BRIAN_TANNER,M,18-Aug-36,ALCARAZ_NORTE,TIFFANYHOLT@GMAIL.COM 
+1249,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,07-Dec-20,JENNIFER_TAYLOR,F,30-Jun-45,COSTA_GRANDE,ROSERICHARD@GMAIL.COM +1250,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,07-Dec-20,PATRICIA_HOWARD,F,24-Dec-82,CAÑADITA,MICHAELWILSON@HOTMAIL.COM +1251,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,07-Dec-20,KRISTIN_ROGERS,F,28-May-57,CAÑADON_CHILENO,MICHAELHARRISON@YAHOO.COM +1252,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,08-Dec-20,DAVID_ARMSTRONG,M,03-Sep-17,COLONIA_FALCO,JIMMYFERNANDEZ@GMAIL.COM +1253,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,08-Dec-20,KIMBERLY_HOPKINS,F,18-Jan-20,ARTEAGA,AJONES@HOTMAIL.COM +1254,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,08-Dec-20,BRANDON_BARRY,M,06-Feb-45,AGUA_AMARILLA_LA_HOYADA,HEATHER53@YAHOO.COM +1255,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,08-Dec-20,JASON_HARDIN,M,01-Jan-92,MARIANO_ACOSTA,MARK10@GMAIL.COM +1256,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,08-Dec-20,JILL_GARDNER,F,14-Sep-20,COLONIA_1_DE_MAYO,JENKINSJEREMY@HOTMAIL.COM +1257,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,08-Dec-20,CATHERINE_DUNCAN,F,20-Aug-84,EL_ZURDO,BROOKSMONIQUE@YAHOO.COM +1258,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,08-Dec-20,JEFFREY_KIM,M,29-Jan-79,ALGARROBO_GRANDE,MARYCONLEY@GMAIL.COM +1259,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,08-Dec-20,SUZANNE_REYNOLDS,F,26-Aug-95,LA_ORIENTAL,VNELSON@YAHOO.COM +1260,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,08-Dec-20,BELINDA_ANDERSON,F,20-Sep-89,ALTO_LINDO,HAYLEY27@HOTMAIL.COM +1261,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,08-Dec-20,ANGELA_MARTIN,F,24-Mar-20,BARADERO,WMARSHALL@HOTMAIL.COM +1262,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,08-Dec-20,JOHN_HENDRICKS,M,15-Sep-51,BUENA_VISTA,DONALD26@GMAIL.COM +1263,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,08-Dec-20,JASON_VILLEGAS,M,26-Oct-94,LAS_PALMAS,JOHN30@HOTMAIL.COM 
+1264,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,08-Dec-20,JOHN_MITCHELL,M,14-Aug-75,EL_CENIZO,RICHARDGONZALES@HOTMAIL.COM +1265,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,08-Dec-20,ALICIA_BRIDGES,F,11-May-99,COMANDANTE_GRANVILLE,DAVIDRUIZ@YAHOO.COM +1266,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,08-Dec-20,WILLIAM_MALONE,M,26-Sep-70,3_DE_MAYO,BLAKEGIBSON@HOTMAIL.COM +1267,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,09-Dec-20,JENNIFER_MOSS,F,14-Apr-08,IRENEO_PORTELA,ALLISON27@GMAIL.COM +1268,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,09-Dec-20,MARTIN_BAILEY,M,26-Sep-89,CHAPUY,BROWNZACHARY@YAHOO.COM +1269,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,09-Dec-20,AMANDA_WHITE,F,28-Jul-10,EL_PINO,EHALEY@YAHOO.COM +1270,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,09-Dec-20,ELIZABETH_JONES,F,27-Mar-09,CASEROS,DOMINIQUEPAGE@GMAIL.COM +1271,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,09-Dec-20,ERIC_CLARK,M,05-Jan-72,ALTO_GRANDE,HEATHERNGUYEN@HOTMAIL.COM +1272,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,09-Dec-20,LAUREN_CLEMENTS,F,08-Feb-89,AGUSTONI,PETERROMERO@GMAIL.COM +1273,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,09-Dec-20,RYAN_JONES,M,13-Dec-37,COLONIA_LA_YERBA,MARK29@HOTMAIL.COM +1274,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,09-Dec-20,CHRISTOPHER_WARD,M,26-Jan-14,AGUA_COLORADA,CHERYL77@GMAIL.COM +1275,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,09-Dec-20,ANDREA_MOODY,F,22-Dec-96,BERRETTA,ROBERTSOTO@HOTMAIL.COM +1276,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,09-Dec-20,AMY_HICKS,F,18-Feb-18,AGUA_AMARILLA_LA_HOYADA,ZRILEY@GMAIL.COM +1277,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,09-Dec-20,BRIANA_GONZALEZ,F,04-Aug-87,CAPITAN_SOLARI,HARRISMIKE@GMAIL.COM 
+1278,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,09-Dec-20,CHRISTY_NAVARRO,F,08-Nov-96,ANTA_CHICA,TONY37@HOTMAIL.COM +1279,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,09-Dec-20,JENNIFER_JONES,F,14-Jul-43,CHANILAO,CHRISTOPHERROSE@GMAIL.COM +1280,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,10-Dec-20,JEREMIAH_SINGLETON,M,19-Oct-05,ARROYO_FEDOR,JENNIFERBARTLETT@YAHOO.COM +1281,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,10-Dec-20,DIANE_GUZMAN,F,17-Apr-53,ARROYO_DEL_CURA,WILLIAMSAMANDA@HOTMAIL.COM +1282,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,10-Dec-20,CRYSTAL_CANTRELL,F,27-Dec-02,FARO_SAN_ANTONIO,JESSICA77@HOTMAIL.COM +1283,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,10-Dec-20,CHERYL_CRUZ,F,18-Mar-51,BANFIELD,CHARLENEBARKER@GMAIL.COM +1284,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,10-Dec-20,ROBERT_LAWRENCE,M,16-Jul-05,LA_BANDA,DOMINGUEZSCOTT@HOTMAIL.COM +1285,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,10-Dec-20,MICHELLE_SHAW,F,01-May-19,CAMINO_CENTENARIO_KM_11500,RAYMOND31@YAHOO.COM +1286,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,10-Dec-20,BETH_CAREY,F,30-Aug-77,BALSA_SENILLOSA,KEITHOWENS@GMAIL.COM +1287,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,10-Dec-20,CHRISTINE_WILLIAMS,F,23-Sep-31,CUCHA_CUCHA,ANGEL92@YAHOO.COM +1288,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,10-Dec-20,JAMES_JOHNSON,M,18-Jan-99,ALDEA_BELEIRO,PACHECODEAN@YAHOO.COM +1289,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,10-Dec-20,JUAN_TAYLOR,M,10-Apr-42,BAJASTINE,JULIEHENRY@HOTMAIL.COM +1290,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,10-Dec-20,ROBERT_GRAVES,M,03-Oct-13,BUEN_PASTO,DSPARKS@YAHOO.COM +1291,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,10-Dec-20,SHAWN_TUCKER,M,07-Aug-01,LA_ISABEL,BARNETTVALERIE@YAHOO.COM +1292,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,10-Dec-20,DESIREE_CURTIS,F,25-Mar-09,BALNEARIO_LOS_ANGELES,ANDREW22@GMAIL.COM 
+1293,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,10-Dec-20,DENISE_SANCHEZ,F,12-Nov-14,LA_ISABEL,HILLADAM@GMAIL.COM +1294,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,10-Dec-20,RACHEL_RAMOS,F,20-Aug-59,COLONIA_LAS_YESCAS,YWALLER@YAHOO.COM +1295,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,11-Dec-20,MIKE_SHARP,M,16-Oct-54,CROTTO,ZHOOPER@YAHOO.COM +1296,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,11-Dec-20,TAMMY_FLORES,F,02-Aug-61,COLONIA_LA_INDIA,MICHAEL50@HOTMAIL.COM +1297,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,11-Dec-20,ROBERT_NICHOLSON_DDS,M,28-Dec-84,ALCARAZ_2DO,COURTNEYLEWIS@GMAIL.COM +1298,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,11-Dec-20,RYAN_SMITH,M,20-Dec-42,MUÑIZ,CINDY93@GMAIL.COM +1299,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,11-Dec-20,WILLIAM_KIRK,M,27-Oct-42,AMAMBAY,FRANK65@HOTMAIL.COM +1300,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,11-Dec-20,ROBERT_MUELLER,M,11-Jan-98,SEY,JONESSTEPHEN@GMAIL.COM +1301,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,11-Dec-20,PHILIP_ROBINSON,M,18-Jul-99,ALDEA_FORESTAL,TYLERTURNER@GMAIL.COM +1302,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,12-Dec-20,MARY_CONNER,F,27-Apr-61,ARROYO_CASCO,WMARSH@GMAIL.COM +1303,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,12-Dec-20,JONATHAN_JOHNSON,M,27-Jan-28,COLONIA_ABATE,FWILSON@HOTMAIL.COM +1304,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,12-Dec-20,MICHELLE_FLOYD,F,25-Sep-32,ALBERTI,ANGELAPARSONS@GMAIL.COM +1305,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,12-Dec-20,TROY_CHRISTIAN,M,05-Apr-11,AGUA_BLANCA,LVAZQUEZ@GMAIL.COM +1306,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,12-Dec-20,PATRICIA_GARCIA,F,27-Dec-15,ESTACION_DE_ZOOTECNIA_B,CARTERJUAN@HOTMAIL.COM +1307,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,12-Dec-20,ASHLEE_PETERSON,F,18-Feb-46,OLASCOAGA,BRYANWELLS@GMAIL.COM 
+1308,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,12-Dec-20,ASHLEY_ROBINSON,F,10-Nov-96,BME_BAVIO_GRAL_MANSILLA,GARYBENNETT@YAHOO.COM +1309,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,12-Dec-20,MARY_GREEN,F,17-Mar-09,COLONIA_SAN_FRANCISCO,CHRISTINARICHARDSON@YAHOO.COM +1310,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,12-Dec-20,JOEL_RICHARDSON,M,14-Jan-85,ARRAYANAL,SINGLETONJAMES@YAHOO.COM +1311,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,12-Dec-20,RYAN_TURNER,M,26-Jul-28,10_DE_MAYO,HEATHERHARRIS@YAHOO.COM +1312,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,12-Dec-20,JUSTIN_CHASE,M,20-Apr-47,CABILDO,WJONES@HOTMAIL.COM +1313,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,12-Dec-20,LISA_MCBRIDE,F,17-Oct-20,ALZAGA,THOMPSONCRAIG@HOTMAIL.COM +1314,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,13-Dec-20,GLENN_MEZA,M,14-Jun-17,BAJO_DE_RACO,JHART@YAHOO.COM +1315,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,13-Dec-20,ERIC_RANDOLPH,M,03-Feb-14,CAMINERA,DESTINYCOLLINS@HOTMAIL.COM +1316,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,13-Dec-20,JASON_FROST,M,01-Jan-82,FARO_QUERANDI,AMANDAPEARSON@YAHOO.COM +1317,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,13-Dec-20,ANN_MCKEE,F,16-Apr-15,COLONIA_CENTENARIO,KRISTYTAYLOR@YAHOO.COM +1318,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,13-Dec-20,DOUGLAS_GONZALEZ,M,17-Feb-04,ORIENTE,LAURABALL@HOTMAIL.COM +1319,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,13-Dec-20,CHARLES_RIVERA,M,09-Mar-35,COLONIA_ENSANCHE_SAUCE,DAVIDCURRY@HOTMAIL.COM +1320,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,13-Dec-20,MARK_LEWIS,M,25-Jul-66,ISLA_GRAN_MALVINA,ZFROST@GMAIL.COM +1321,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,13-Dec-20,DANIEL_CRAIG,M,05-Sep-45,COMODORO_PY,QDENNIS@YAHOO.COM +1322,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,13-Dec-20,ETHAN_PERRY,M,17-Mar-49,ISLA_TIGRE,DIANARUSSELL@YAHOO.COM 
+1323,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,13-Dec-20,BRYAN_KANE,M,22-Sep-15,MANUEL_OCAMPO,WEAVERRODNEY@GMAIL.COM +1324,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,14-Dec-20,JORDAN_HERRING,F,16-Feb-58,CORBETT,GONZALEZSHAWN@GMAIL.COM +1325,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,14-Dec-20,GREGORY_SPARKS,M,09-Sep-55,ALDEA_SAN_GREGORIO,MARIAMITCHELL@GMAIL.COM +1326,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,14-Dec-20,MELISSA_CRAIG,F,14-May-39,ALTO_DEL_MOLLE,EKLEIN@GMAIL.COM +1327,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,14-Dec-20,TERESA_NAVARRO,F,02-Oct-67,TRUJUI,ANDREAGARDNER@GMAIL.COM +1328,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,14-Dec-20,HEATHER_AVILA,F,01-Nov-13,EL_DURAZNO,GRAHAMRYAN@HOTMAIL.COM +1329,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,14-Dec-20,JOHN_LUCAS,M,10-Apr-58,CAMPO_DE_VILLAMIL,WRAMIREZ@GMAIL.COM +1330,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,14-Dec-20,JAMES_CONLEY,M,31-Oct-84,ALMACEN_LA_COLINA,APRILBELL@YAHOO.COM +1331,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,14-Dec-20,HENRY_JONES,M,03-May-89,MESON_DE_FIERRO,MORRISCRAIG@GMAIL.COM +1332,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,14-Dec-20,RONALD_DAVIS,M,24-Feb-50,PELLEGRINI,RICKYSELLERS@HOTMAIL.COM +1333,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,14-Dec-20,JASON_MOORE,M,16-Feb-61,AGUAS_BUENAS,JESSICA38@HOTMAIL.COM +1334,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,14-Dec-20,JOHN_LITTLE,M,06-Feb-81,CAMPO_DE_LOS_TOROS,JSMITH@YAHOO.COM +1335,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,15-Dec-20,MARK_KLEIN,M,13-Aug-92,ARENAZA,JOSHUABENNETT@HOTMAIL.COM +1336,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,15-Dec-20,CHERYL_JACOBS,F,03-Mar-94,COLONIA_ABATE,VINCENT49@YAHOO.COM +1337,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,15-Dec-20,TRACY_YOUNG,F,11-Jan-26,CAÑADON_SECO,HTHOMAS@HOTMAIL.COM 
+1338,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,15-Dec-20,SAVANNAH_RODRIGUEZ,F,25-Mar-26,DESAMPARADOS,AMYCABRERA@HOTMAIL.COM +1339,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,15-Dec-20,CHLOE_WILSON,F,05-Apr-03,ALDEA_BRASILERA,DONALD67@YAHOO.COM +1340,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,15-Dec-20,SHELBY_FITZGERALD,F,26-Mar-75,BAÑOS_PISMANTA,NICHOLSSAMANTHA@HOTMAIL.COM +1341,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,15-Dec-20,CHRISTINE_CARLSON,F,24-Nov-10,FLORIDA,MICHAELSMITH@GMAIL.COM +1342,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,15-Dec-20,ROBERT_MCCARTY,M,22-Feb-60,LANDETA,ROMERODEVIN@HOTMAIL.COM +1343,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,15-Dec-20,MONIQUE_CRUZ,F,16-Feb-08,AIMOGASTA,DEREK19@GMAIL.COM +1344,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,15-Dec-20,TYLER_COLE,M,04-Jun-95,COLONIA_LA_INDIA,WILLIAMPHILLIPS@GMAIL.COM +1345,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,15-Dec-20,NICOLE_JORDAN,F,04-Oct-95,AMENABAR,TERESAALVAREZ@YAHOO.COM +1346,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,16-Dec-20,TYLER_SULLIVAN,M,02-Dec-60,LA_LUCILA_DEL_MAR,RENEE54@GMAIL.COM +1347,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,16-Dec-20,JONATHAN_MARTIN,M,11-Feb-67,ALDAO,NMILLS@YAHOO.COM +1348,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,16-Dec-20,MICHEAL_STEIN,M,10-Feb-85,ACHAVAL_RODRIGUEZ,DIAZRONALD@HOTMAIL.COM +1349,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,16-Dec-20,PATRICIA_WILLIAMS,F,26-Oct-81,BOWEN,ALEC92@GMAIL.COM +1350,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,16-Dec-20,ALLEN_LUNA,M,14-Oct-06,ALMACEN_EL_DESCANSO,CORY21@HOTMAIL.COM +1351,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,16-Dec-20,LAURA_MEJIA,F,24-Oct-99,DIEGO_LOPEZ,DEBRASULLIVAN@GMAIL.COM +1352,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,16-Dec-20,AMBER_GARCIA,F,16-Jul-51,HOSPITAL_NECOCHEA,WILKINSJOHN@GMAIL.COM 
+1353,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,16-Dec-20,DAVID_OLIVER,M,08-Jan-24,ARMSTRONG,PENNINGTONJASON@HOTMAIL.COM +1354,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,16-Dec-20,LAUREN_BAKER,F,26-May-05,BAJO_GRANDE,SSTEWART@HOTMAIL.COM +1355,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,16-Dec-20,PAMELA_WEBER,F,27-Jan-07,CAMPO_COLIQUEO,TINACOOPER@GMAIL.COM +1356,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,16-Dec-20,COLLEEN_WARNER,F,10-Oct-93,VILLA_ADELINA,GENEBYRD@YAHOO.COM +1357,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,16-Dec-20,KRISTINE_DAWSON,F,13-Nov-61,AERO_CLUB_ROSARIO,DAWN66@YAHOO.COM +1358,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,17-Dec-20,JORDAN_BRADFORD,F,19-Apr-45,NORDELTA,DESIREETHOMPSON@YAHOO.COM +1359,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,17-Dec-20,CHRISTOPHER_MEZA,M,11-Sep-08,COLONIA_LOTE_12,CORDOVAPAUL@YAHOO.COM +1360,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,17-Dec-20,KIMBERLY_DAVIS,F,06-Jan-14,KILOMETRO_208,VTHOMAS@HOTMAIL.COM +1361,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,17-Dec-20,TRAVIS_DECKER,M,11-Jun-56,AN_AIKE,VBROWNING@GMAIL.COM +1362,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,17-Dec-20,BRANDY_HOOD,F,25-Oct-93,CAPAYAN,CHRISTOPHER28@YAHOO.COM +1363,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,17-Dec-20,KEVIN_GRAY,M,24-Oct-53,9_DE_JULIO,EBOWMAN@HOTMAIL.COM +1364,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,17-Dec-20,DAVID_MERCADO,M,08-Jul-25,CACHIYUYAL,BRANDY46@GMAIL.COM +1365,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,17-Dec-20,JUSTIN_MARTINEZ_MD,M,02-Mar-12,CAVOUR,CRAWFORDJOEL@GMAIL.COM +1366,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,17-Dec-20,VERONICA_MILLER,F,17-Dec-89,ESTACION_USPALLATA,BRIANWILLIAMS@YAHOO.COM 
+1367,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,17-Dec-20,MELISSA_PARKS,F,22-Dec-33,ALTO_DEL_SALVADOR,BRENDAN00@GMAIL.COM +1368,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,17-Dec-20,HOLLY_TURNER,F,28-Dec-97,ANECON_GRANDE,WILSONLOGAN@YAHOO.COM +1369,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,17-Dec-20,JEFF_BRYANT,M,12-Dec-19,CARAPACHAY,CRAIG17@GMAIL.COM +1370,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,17-Dec-20,BRUCE_GARCIA,M,05-Aug-26,CACIQUE_ARIACAIQUIN,FBAKER@HOTMAIL.COM +1371,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,17-Dec-20,MARK_HOLT,M,12-Mar-82,ARSENAL_DE_GUERRA_SAN_LORENZO,AUSTIN38@HOTMAIL.COM +1372,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,17-Dec-20,KRISTA_HOLDEN,F,31-Aug-53,SARANDI,MARCUSWARE@GMAIL.COM +1373,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,17-Dec-20,NICHOLAS_LAWRENCE,M,02-Jul-09,GRACIARENA,XJOHNSON@YAHOO.COM +1374,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,18-Dec-20,BRITTANY_SMITH,F,22-May-76,COLONIA_DUPORTAL,BRIANMENDEZ@YAHOO.COM +1375,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,18-Dec-20,DYLAN_HARVEY,M,04-Dec-01,CAMPO_PEÑA_LOPEZ,RUTH99@YAHOO.COM +1376,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,18-Dec-20,KATHLEEN_CARTER,F,02-Sep-73,LA_FLORENCIA,CBEAN@HOTMAIL.COM +1377,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,18-Dec-20,XAVIER_SMITH,M,02-Mar-56,AVANZADA,JONATHANSMITH@YAHOO.COM +1378,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,18-Dec-20,WHITNEY_ROBINSON,F,05-Jan-46,LANGUEYU,MICHAEL10@YAHOO.COM +1379,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,18-Dec-20,DANIELLE_HALL,F,01-Jun-17,ESTELA,JORDANSEAN@YAHOO.COM +1380,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,18-Dec-20,BRIANNA_LONG,F,15-Apr-32,BAHIA_LANGARA,JENNIFER40@YAHOO.COM +1381,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,18-Dec-20,JENNY_VANCE,F,18-Dec-71,FUNKE,ZMIDDLETON@GMAIL.COM 
+1382,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,18-Dec-20,SHERYL_MARTINEZ,F,28-Nov-01,AN_AIKE,TUCKERALLISON@GMAIL.COM +1383,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,18-Dec-20,RYAN_PETERSON,M,19-Nov-55,ISLA_VICTORIA,LKELLY@YAHOO.COM +1384,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,18-Dec-20,AARON_BISHOP,M,29-Aug-06,COLONIA_CALIFORNIA,JONATHAN81@YAHOO.COM +1385,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,18-Dec-20,MARK_JOHNSON,M,05-Jul-43,EL_CHALTEN,MWILLIAMS@YAHOO.COM +1386,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,18-Dec-20,BARBARA_MCDONALD,F,09-Dec-37,COLONIA_BELGA_AMERICANA,MARIAGARZA@GMAIL.COM +1387,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,18-Dec-20,ALLISON_MARSHALL,F,17-Apr-75,CAÑADA_DE_LAS_VACAS,BARTONJOHN@GMAIL.COM +1388,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,18-Dec-20,BETHANY_HERNANDEZ,F,07-Apr-80,LLAVALLOL,DEBORAHTAYLOR@GMAIL.COM +1389,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,18-Dec-20,NATHAN_FRANKLIN,M,11-May-58,ALTO_DE_LAS_ARAÑAS,BRITTANYFORBES@GMAIL.COM +1390,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,19-Dec-20,RACHEL_RIVERA,F,28-Nov-98,RIO_MAYO,HGALLEGOS@GMAIL.COM +1391,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,19-Dec-20,MICHAEL_LEWIS,M,17-Mar-70,TRISTAN_SUAREZ,WILLIAMSMATTHEW@GMAIL.COM +1392,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,19-Dec-20,KIMBERLY_HENDERSON,F,07-May-62,LA_TRANCA,FSTEWART@GMAIL.COM +1393,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,19-Dec-20,KIM_SILVA,F,20-Mar-43,FARO_SAN_ANTONIO,IVAN36@GMAIL.COM +1394,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,19-Dec-20,RANDALL_CLINE,M,10-Jul-09,ARIJON,HAYESDANIEL@YAHOO.COM +1395,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,19-Dec-20,RAYMOND_HUDSON,M,24-Jan-86,LOMAS_DEL_MIRADOR,AMANDAJENSEN@YAHOO.COM +1396,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,19-Dec-20,GILBERT_HANSON,M,11-Feb-00,EL_JUMEAL,JANICELOPEZ@YAHOO.COM 
+1397,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,19-Dec-20,JORDAN_JOSEPH,M,19-Apr-40,COLONIA_CELINA,YSMITH@YAHOO.COM +1398,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,19-Dec-20,BRANDON_SCHULTZ,M,27-Feb-11,COLONIA_BELGA_AMERICANA,DALE02@GMAIL.COM +1399,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,19-Dec-20,JUSTIN_NGUYEN,M,09-Dec-84,EST_JAUREGUI_VA_FLANDRIA,POROZCO@HOTMAIL.COM +1400,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,19-Dec-20,SUSAN_ELLIOTT,F,28-Nov-88,SUNDBLAD,WILLIAM67@GMAIL.COM +1401,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,20-Dec-20,AMANDA_ROGERS,F,18-Sep-77,ADOLFO_VAN_PRAET,NATASHA58@GMAIL.COM +1402,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,20-Dec-20,DAVID_WEST,M,19-Apr-69,AMAMBAY,JESSICA85@YAHOO.COM +1403,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,20-Dec-20,JASON_WOOD,M,14-Apr-89,ARROYO_LAS_MINAS,DONNA48@GMAIL.COM +1404,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,20-Dec-20,SARAH_SIMON,F,02-Jun-52,COLONIA_TACURALES,KEVIN81@GMAIL.COM +1405,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,20-Dec-20,FRANCISCO_SWEENEY,M,03-Jul-43,AGUADA_DE_LAS_TEJAS,RMCINTOSH@HOTMAIL.COM +1406,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,20-Dec-20,COURTNEY_MALONE,F,07-Apr-77,CERANA,JASONADAMS@GMAIL.COM +1407,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,20-Dec-20,ROBERT_BECK,M,03-Jun-06,COLONIA_BARGA,RANDYADAMS@YAHOO.COM +1408,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,21-Dec-20,CHRISTINE_ARCHER,F,19-Jul-86,ESTACION_CHRISTOPHERSEN,RCOLEMAN@GMAIL.COM +1409,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,21-Dec-20,TAMMY_SUTTON,F,18-Jun-52,FRANCISCO_MADERO,CHARLES28@HOTMAIL.COM +1410,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,21-Dec-20,DUSTIN_ANDERSON,M,26-Apr-11,COLONIA_HINOJO,HHOFFMAN@GMAIL.COM 
+1411,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,21-Dec-20,LORI_WRIGHT,F,26-Jan-16,CAPILLA_DEL_SEÑOR,ROBIN14@HOTMAIL.COM +1412,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,21-Dec-20,MARIE_PARK,F,18-Mar-00,ARROYO_FEDOR,JEFFGOMEZ@YAHOO.COM +1413,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,21-Dec-20,CHRISTOPHER_MORRIS,M,20-Mar-13,AVENA,JSMITH@YAHOO.COM +1414,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,21-Dec-20,DONNA_HORN,F,24-Oct-51,VILLANI,XMITCHELL@HOTMAIL.COM +1415,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,21-Dec-20,ANTHONY_HODGES,M,23-Mar-82,ATREUCO,NRODRIGUEZ@HOTMAIL.COM +1416,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,21-Dec-20,SUSAN_WILCOX,F,30-Nov-92,CORONEL_ISLEÑOS,ALEXANDER72@HOTMAIL.COM +1417,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,21-Dec-20,MARIAH_GRIFFITH,F,18-Jul-64,ALPACHIRI,ROBERTBERG@YAHOO.COM +1418,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,21-Dec-20,RONNIE_SHORT_JR.,M,15-Aug-11,AGUADA_GRANDE,XNGUYEN@HOTMAIL.COM +1419,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,22-Dec-20,JULIE_MARTIN,F,28-Sep-12,ESTACION_USPALLATA,SANDOVALCHRISTY@YAHOO.COM +1420,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,22-Dec-20,JESSICA_BRANCH,F,17-Apr-48,AGUA_DEL_SIMBOL,PERRYASHLEY@GMAIL.COM +1421,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,22-Dec-20,KEITH_MCFARLAND,M,19-Nov-28,ARBOL_VERDE,FRANKWIGGINS@GMAIL.COM +1422,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,22-Dec-20,JILL_WOODS,F,25-Oct-84,EL_ZORRO,ROBERTJONES@HOTMAIL.COM +1423,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,22-Dec-20,JOHN_PARKER,M,10-Oct-94,PUESTO_DE_ISLA,JOHNPERRY@GMAIL.COM +1424,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,22-Dec-20,SUSAN_ROSS,F,19-Sep-07,BOQUERON,BROOKEBULLOCK@GMAIL.COM 
+1425,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,22-Dec-20,DEBORAH_WRIGHT,F,23-Jan-76,ARROYO_DE_LA_VENTANA,WHITNEYGARZA@YAHOO.COM +1426,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,22-Dec-20,ROBERT_REILLY,M,05-Dec-69,AGUILARES,BRADFORDSHAWN@HOTMAIL.COM +1427,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,22-Dec-20,SABRINA_MOODY,F,08-Feb-11,ARIEL,VPAYNE@GMAIL.COM +1428,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,22-Dec-20,MRS._ELIZABETH_THOMPSON_DVM,F,29-Sep-08,BARCENA,PAULAWINTERS@GMAIL.COM +1429,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,22-Dec-20,DAVID_PETERSON,M,14-Oct-08,EL_PIMPOLLO,WILLIAM33@GMAIL.COM +1430,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,22-Dec-20,BRANDON_KENNEDY,M,21-Nov-10,LA_CHINACA,FRANCES05@HOTMAIL.COM +1431,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,23-Dec-20,PAUL_BARRON,M,13-Jul-12,COLONIA_NUEVA_MONTEVIDEO,NICHOLEMONTOYA@YAHOO.COM +1432,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,23-Dec-20,CHRISTOPHER_YORK,M,07-Oct-85,AGUA_DE_DIAZ,ADAMSKAYLEE@HOTMAIL.COM +1433,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,23-Dec-20,SAMUEL_SMITH,M,23-Jan-83,AMANA,CAROLYNBROWN@YAHOO.COM +1434,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,23-Dec-20,HECTOR_REYES,M,02-Jan-24,AGUA_DE_LOS_MANANTIALES,ANGELAMCCLAIN@YAHOO.COM +1435,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,23-Dec-20,ALBERT_MERCER,M,03-Feb-72,BAÑADO_NORTE,KHALL@GMAIL.COM +1436,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,23-Dec-20,RAYMOND_MOLINA,M,23-Mar-02,LA_LUCILA_DEL_MAR,CRYSTALHEBERT@HOTMAIL.COM +1437,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,23-Dec-20,ALEXIS_CARTER,F,20-Jun-15,EL_CAMOATI,LAURA35@YAHOO.COM +1438,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,23-Dec-20,SUSAN_BROWN,F,21-Feb-07,ALTO_CALILEGUA,DAVID34@HOTMAIL.COM +1439,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,23-Dec-20,NICHOLAS_MENDOZA,M,10-Jul-06,ABRAMO,HALLDILLON@YAHOO.COM 
+1440,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,23-Dec-20,MARY_WHITE,F,23-Jul-75,CHOVET,NICHOLAS19@GMAIL.COM +1441,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,23-Dec-20,EMILY_JOHNSON,F,21-Jun-67,COLONIA_EL_POTRERO,CHRISTIANREYNOLDS@YAHOO.COM +1442,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,23-Dec-20,JAMIE_HART,F,08-Feb-07,IRENEO_PORTELA,MMEDINA@GMAIL.COM +1443,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,24-Dec-20,MIRANDA_ZUNIGA,F,28-Dec-74,CABRED,STEPHENTORRES@GMAIL.COM +1444,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,24-Dec-20,ANN_NGUYEN,F,06-Jan-82,LA_PUNTA,ALEX32@GMAIL.COM +1445,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,24-Dec-20,JOHN_JOHNSON,M,08-Nov-03,APOSTOLES,XDIAZ@GMAIL.COM +1446,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,24-Dec-20,CAROLYN_ROBINSON,F,09-Oct-50,EDUARDO_COSTA,SHERRYMCBRIDE@YAHOO.COM +1447,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,24-Dec-20,ROBERT_MCDANIEL,M,15-Jul-54,CALCHAQUI,SCOTTMICHAEL@YAHOO.COM +1448,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,24-Dec-20,BRADLEY_BARNES,M,29-Oct-07,COLONIA_VELEZ,LOVEVICTOR@HOTMAIL.COM +1449,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,24-Dec-20,AARON_SOTO,M,01-Jul-42,CALERA,KRISTIRICHARDSON@HOTMAIL.COM +1450,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,24-Dec-20,TRAVIS_MEADOWS,M,11-Dec-08,JOSE_FERRARI,YCAMACHO@HOTMAIL.COM +1451,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,24-Dec-20,VANESSA_HARRIS,F,04-Mar-92,9_DE_JULIO,NATHAN71@YAHOO.COM +1452,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,24-Dec-20,PATRICIA_COWAN,F,26-Jan-16,BARCALA,BRIANA86@HOTMAIL.COM +1453,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,24-Dec-20,STEPHEN_WALL,M,19-Aug-68,BETBEDER,RMOORE@YAHOO.COM +1454,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,24-Dec-20,MARK_HAMILTON,M,17-Nov-03,ABRA_BAYA,ANDERSONROBERT@GMAIL.COM 
+1455,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,24-Dec-20,KELLY_SMITH,F,02-Nov-00,CAMPO_DE_LOS_ANDES,VANESSA75@HOTMAIL.COM +1456,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,24-Dec-20,MICHAEL_HANSON,M,17-May-44,EMPALME_VILLA_CONSTITUCION,MILLERCODY@YAHOO.COM +1457,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,25-Dec-20,ANTHONY_DIAZ,M,11-Apr-72,BLANDENGUES,XORTIZ@HOTMAIL.COM +1458,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,25-Dec-20,WILLIAM_HOWARD,M,30-Nov-54,KILOMETRO_77,JZAMORA@YAHOO.COM +1459,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,25-Dec-20,NANCY_LIVINGSTON,F,23-Feb-41,DEL_VALLE,CORTEZBRITTANY@YAHOO.COM +1460,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,25-Dec-20,NICHOLAS_KING,M,07-Aug-47,ALARCON,BROOKSSARAH@GMAIL.COM +1461,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,25-Dec-20,LAURIE_SMITH,F,30-Dec-52,CUARTEL_IV,LINDSAYHENRY@HOTMAIL.COM +1462,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,25-Dec-20,ANDREW_SOTO,M,19-Sep-22,9_DE_JULIO,MADDOXEUGENE@GMAIL.COM +1463,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,25-Dec-20,JOSEPH_HEBERT,M,19-Jan-90,BARRIO_BELGRANO,WILLISAMY@HOTMAIL.COM +1464,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,25-Dec-20,DR._KATHLEEN_BARBER,F,31-Jul-76,B_LOS_AROMOS_SAN_PATRICIO,KATHERINEFARLEY@HOTMAIL.COM +1465,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,25-Dec-20,FRANK_HALE,M,06-Nov-13,CAMPO_RAFFO,CASTILLORONALD@GMAIL.COM +1466,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,25-Dec-20,BOBBY_MOORE,M,30-Nov-45,CENTENARIO,JAMESGREGORY@GMAIL.COM +1467,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,25-Dec-20,ALICIA_HARDIN,F,12-Apr-52,CAÑADA_RICA,KRISTINA68@HOTMAIL.COM +1468,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,25-Dec-20,THOMAS_STEWART,M,14-Apr-56,ACONQUIJA,STHOMAS@YAHOO.COM +1469,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,25-Dec-20,KAYLA_WEBB,F,28-Feb-95,BENITEZ,JOCELYN85@YAHOO.COM 
+1470,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,25-Dec-20,JAY_SULLIVAN,M,06-Aug-07,COLONIA_AROCENA_INA,VCOOK@HOTMAIL.COM +1471,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,25-Dec-20,CYNTHIA_CARNEY,F,21-May-56,BARRIALITOS,WILSONKIMBERLY@YAHOO.COM +1472,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,26-Dec-20,WENDY_NELSON,F,02-Jan-46,BERRAONDO,NHILL@GMAIL.COM +1473,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,26-Dec-20,APRIL_HANSEN,F,24-Aug-11,COLONIA_ABORIGEN,DEBORAHMILLER@YAHOO.COM +1474,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,26-Dec-20,HALEY_SCOTT,F,06-May-04,EL_CAMOATI,MATTHEWRODGERS@GMAIL.COM +1475,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Dec-20,MR._JOSEPH_ONEAL,M,10-Apr-46,HITO_45,LEWISCHRISTOPHER@HOTMAIL.COM +1476,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Dec-20,BRYAN_MEDINA,M,14-Jun-10,CAMPO_DE_LOS_ANDES,NANCYMORTON@HOTMAIL.COM +1477,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,26-Dec-20,ANDREA_MCKEE,F,27-Jun-21,VILLANI,AMANDA01@HOTMAIL.COM +1478,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,26-Dec-20,BENJAMIN_HUGHES,M,27-Dec-21,EL_PEREGRINO,ANGELA56@HOTMAIL.COM +1479,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,26-Dec-20,AUDREY_DILLON,F,12-Aug-13,PASO_DEL_REY,JENSENJENNIFER@GMAIL.COM +1480,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,26-Dec-20,ANGELA_ANDERSON,F,01-Jan-87,CANTERA_AGUIRRE,SMITHDAVID@YAHOO.COM +1481,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,26-Dec-20,DAVID_MCCOY,M,24-Dec-05,ALARCON,YADAMS@HOTMAIL.COM +1482,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,26-Dec-20,MARY_TUCKER,F,31-May-94,LA_GAMA,YSHAW@HOTMAIL.COM +1483,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,27-Dec-20,RACHEL_MASON,F,10-Feb-73,CAÑADA_DE_GOMEZ,GARZAPATRICIA@HOTMAIL.COM +1484,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,27-Dec-20,CHARLES_JONES,M,04-Dec-95,ALGARROBO,PYOUNG@HOTMAIL.COM 
+1485,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,27-Dec-20,ALEX_HURLEY,M,28-Nov-43,ABRA_MAYO,CAROLYN25@GMAIL.COM +1486,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,27-Dec-20,PATRICIA_MORRIS,F,30-Dec-61,COLONIA_RIVAS,WOLFDANIELLE@HOTMAIL.COM +1487,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,27-Dec-20,DANIEL_NELSON,M,02-Oct-74,VILLA_ANGELICA,ASALAZAR@HOTMAIL.COM +1488,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,27-Dec-20,BROOKE_BUSH,F,17-Feb-15,CARCARAÑA,ISAACFORD@HOTMAIL.COM +1489,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,27-Dec-20,AMANDA_ROBERTS,F,02-Nov-44,ANTONIO_CARBONI,STAYLOR@HOTMAIL.COM +1490,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,27-Dec-20,OMAR_BALDWIN,M,05-Jul-98,BECCAR,RICHARD61@YAHOO.COM +1491,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,27-Dec-20,DAVID_KAISER,M,18-Jan-99,CAPITAN_SOLARI,LEROYDAVIS@GMAIL.COM +1492,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,27-Dec-20,RICHARD_BANKS,M,07-Sep-91,CAÑADON_CALIENTE,GMORRIS@YAHOO.COM +1493,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,27-Dec-20,LOGAN_LAWRENCE,M,10-Apr-62,LA_ISABEL,HAMILTONSTEVEN@GMAIL.COM +1494,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,27-Dec-20,CHARLES_BAUTISTA,M,04-Dec-03,VILLA_OLIVARI,COLEMANMICHAEL@GMAIL.COM +1495,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,27-Dec-20,DAVID_COX_II,M,19-Apr-12,EL_JAGUEL,DALTONSTACEY@HOTMAIL.COM +1496,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,27-Dec-20,TRACY_PARKER,F,24-May-13,AGUA_COLORADA,QPERKINS@GMAIL.COM +1497,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,27-Dec-20,CAITLIN_LONG,F,12-Aug-08,BENAVIDEZ,JENNIFER24@GMAIL.COM +1498,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,27-Dec-20,SARA_DIAZ,F,27-Feb-58,BARTOLOME_MITRE,AMBERMARTIN@GMAIL.COM 
+1499,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,27-Dec-20,SHERI_FITZGERALD,F,07-Apr-28,ITURRASPE,TAYLOROBRIEN@GMAIL.COM +1500,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,28-Dec-20,ANTHONY_CLEMENTS,M,25-May-59,10_DE_MAYO,JOSEPHHALE@HOTMAIL.COM +1501,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,28-Dec-20,KRISTIE_SHAFFER,F,13-Oct-15,EDMUNDO_PERKINS,REBECCAHOUSTON@HOTMAIL.COM +1502,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,28-Dec-20,JACOB_DODSON,M,15-Jul-91,AGUA_DE_LA_PIEDRA,ANDREA35@YAHOO.COM +1503,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,28-Dec-20,GABRIEL_ALEXANDER,M,15-May-33,CAMPO_CALVO,ROBERT79@HOTMAIL.COM +1504,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,28-Dec-20,LORI_MOORE,F,23-Oct-82,CANDELARIA_SUD,BRIANRIVERS@GMAIL.COM +1505,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,28-Dec-20,ALEXANDER_SIMMONS,M,26-Jun-18,CAMPO_MOISES_SECCION_1A,BETTY02@YAHOO.COM +1506,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,28-Dec-20,DANA_HARTMAN,F,04-Feb-57,AGUAS_CALIENTES,WILLIAMRAMOS@HOTMAIL.COM +1507,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,28-Dec-20,JOSE_THOMPSON,M,09-Apr-35,AMPACAMA,HUTCHINSONKAREN@HOTMAIL.COM +1508,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,28-Dec-20,LISA_BENNETT,F,07-Aug-65,CAMPO_COUBERT,MAXWELLLAUREN@HOTMAIL.COM +1509,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,28-Dec-20,REGINA_HUTCHINSON,F,27-Mar-60,CASTILLA,SIMPSONMICHELLE@HOTMAIL.COM +1510,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,28-Dec-20,MEAGAN_JONES,F,20-May-56,ACASSUSO,THEODOREMOORE@YAHOO.COM +1511,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,29-Dec-20,LAURA_HERNANDEZ,F,29-May-30,AGUA_AMARGA,SMILLER@GMAIL.COM +1512,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,29-Dec-20,EDGAR_STUART,M,10-Feb-78,OLASCOAGA,OSTEPHENS@GMAIL.COM 
+1513,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,29-Dec-20,DARLENE_ESTRADA,F,16-Apr-49,CARAGUATAY,DYLAN54@GMAIL.COM +1514,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,29-Dec-20,WILLIAM_CARTER,M,13-Sep-60,FLORENCIO_VARELA,AMCCLURE@GMAIL.COM +1515,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,29-Dec-20,STEPHANIE_HARRIS,F,04-Sep-91,FRANCISCO_CASAL,JOSEPHROGERS@GMAIL.COM +1516,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,29-Dec-20,TERESA_REED,F,27-Oct-23,AGUA_BLANCA,GJOHNSON@GMAIL.COM +1517,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,29-Dec-20,KEVIN_JENKINS,M,09-Aug-08,VIRREY_DEL_PINO,JACQUELINE90@YAHOO.COM +1518,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,29-Dec-20,HANNAH_GUERRERO,F,21-Dec-22,LUIS_CHICO,BRYANHOWELL@GMAIL.COM +1519,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,29-Dec-20,TIMOTHY_MORENO,M,01-Feb-34,9_DE_JULIO_KILOMETRO_20,PETERSONCHRISTIAN@YAHOO.COM +1520,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,29-Dec-20,PAULA_DAVIS,F,10-Jun-72,ALUMINE,REBECCA60@YAHOO.COM +1521,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,29-Dec-20,NANCY_WHITE,F,30-Dec-11,EL_DURAZNO,YLEON@GMAIL.COM +1522,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,30-Dec-20,KAREN_BELL,F,10-Mar-36,CASBAS,JAMESHOWE@GMAIL.COM +1523,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,30-Dec-20,CYNTHIA_ROBERTS,F,04-Feb-61,ESTACION_CORONEL_PRINGLES,URODRIGUEZ@HOTMAIL.COM +1524,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,30-Dec-20,BRENDA_RAMOS,F,14-Nov-76,LAS_TONINAS,SMORGAN@YAHOO.COM +1525,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,30-Dec-20,JESSICA_SMITH,F,22-Dec-58,CEBALLOS,WALKERCHRISTOPHER@HOTMAIL.COM +1526,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,30-Dec-20,RICHARD_MCKNIGHT,M,04-Jun-26,LA_PELADA,MOOREWENDY@GMAIL.COM +1527,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,30-Dec-20,DONALD_MERCER,M,24-Apr-27,30_DE_AGOSTO,RYAN73@YAHOO.COM 
+1528,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,30-Dec-20,JENNIFER_STONE,F,22-Aug-61,PASO_DE_LOS_ANDES,ANNBASS@HOTMAIL.COM +1529,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,30-Dec-20,MATTHEW_HENDERSON,M,19-Sep-70,COSTA_DEL_ESTE,SAMUELHODGE@HOTMAIL.COM +1530,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,30-Dec-20,CHARLES_DAVIS,M,12-May-94,CHAMICAL,STEPHEN62@HOTMAIL.COM +1531,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,31-Dec-20,ANDREW_ARROYO,M,23-Dec-03,ARROYO_DULCE,CHARLES81@GMAIL.COM +1532,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,31-Dec-20,MICHAEL_WRIGHT,M,26-Jun-10,CAMINERA,WELCHRANDY@HOTMAIL.COM +1533,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,31-Dec-20,TRACY_BROWN,F,25-Jan-63,BARRIO_GARIN_NORTE,YFLOWERS@GMAIL.COM +1534,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,31-Dec-20,CHRISTOPHER_MORALES,M,18-Feb-88,ALEGRIA,KPARK@HOTMAIL.COM +1535,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,31-Dec-20,RODNEY_GARCIA,M,23-Jul-19,CAÑADA_LA_NEGRA,KATIE74@GMAIL.COM +1536,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,31-Dec-20,THERESA_THOMPSON,F,08-Dec-27,PEREZ,ALLENMICHELLE@GMAIL.COM +1537,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,31-Dec-20,MELISSA_WILEY,F,15-Apr-24,EL_TREBOL,WAREBRITTANY@HOTMAIL.COM +1538,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,31-Dec-20,JENNIFER_WILLIAMS,F,01-May-79,EL_CARBALINO,XHURST@HOTMAIL.COM +1539,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,31-Dec-20,NANCY_LEWIS,F,02-Aug-22,BELLA_VISTA,THERESAMORALES@YAHOO.COM +1540,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,31-Dec-20,JAMIE_CARPENTER,F,09-Jan-07,ALIANZA,DCLARK@YAHOO.COM +1541,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,01-Jan-21,CHARLES_MARSH,M,10-Mar-69,ARENAZA,MARQUEZTIMOTHY@GMAIL.COM +1542,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,01-Jan-21,JENNIFER_ABBOTT,F,03-Jun-58,ARAÑITA,CASSANDRAJONES@GMAIL.COM 
+1543,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,01-Jan-21,BRADLEY_LEE,M,12-Jan-43,ADOLFO_GONZALES_CHAVES,KEVINPARKS@GMAIL.COM +1544,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,01-Jan-21,JOSEPH_ELLIOTT,M,11-Nov-09,ARROYO_LAS_MINAS,KEITH02@GMAIL.COM +1545,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,01-Jan-21,ERIN_LUNA,F,28-Feb-05,AGUADA_DEL_LORO,JENNIFERBURKE@GMAIL.COM +1546,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,01-Jan-21,JAMES_SCHMIDT,M,01-Feb-38,AGUADITA,ADAMSMICHELE@GMAIL.COM +1547,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,01-Jan-21,JULIAN_CHAVEZ,M,31-Dec-67,CAMPO_PESOA,SHAWREBECCA@YAHOO.COM +1548,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,01-Jan-21,LESLIE_GALLAGHER,F,27-Nov-34,ALANICES,CHRISTINA46@YAHOO.COM +1549,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,01-Jan-21,SHAWN_ALVARADO,M,18-Jun-73,ALDECON,KELLYYANG@YAHOO.COM +1550,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,01-Jan-21,SHELBY_REED,F,12-Feb-26,CHAVARRIA,CHRISTINE71@GMAIL.COM +1551,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,01-Jan-21,BARBARA_SMITH,F,12-Nov-16,MERCADO_CENTRAL,EPETERS@HOTMAIL.COM +1552,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,01-Jan-21,ALAN_BLANCHARD,M,05-Dec-77,CAMPO_GARABATO,DEANTHOMAS@HOTMAIL.COM +1553,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,01-Jan-21,TAYLOR_THOMAS,M,21-Jun-27,ABRA_DE_HINOJO,THOMPSONRICHARD@GMAIL.COM +1554,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,02-Jan-21,SHAWN_CAIN,M,10-Mar-17,INGENIERO_HUERGO,CHENERIC@YAHOO.COM +1555,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,02-Jan-21,MARIA_MANNING,F,02-Mar-19,BARRIO_LA_UNION,DIANECRUZ@YAHOO.COM +1556,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,02-Jan-21,AARON_BURKE,M,24-Dec-83,CARRIZALES,NATHANIEL14@GMAIL.COM +1557,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,02-Jan-21,KAYLEE_DIAZ,F,09-Feb-43,CHICHAGASTA,BRENDAHERNANDEZ@YAHOO.COM 
+1558,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,02-Jan-21,DONALD_HALL,M,14-Dec-12,ANDALUCIA,PATRICIA33@HOTMAIL.COM +1559,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,02-Jan-21,ADRIENNE_LEVY,F,08-Nov-07,AZOPARDO,TYLERHALL@YAHOO.COM +1560,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,02-Jan-21,JOSHUA_FARRELL,M,20-Jun-76,ALDAO,BIRDERICA@HOTMAIL.COM +1561,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,02-Jan-21,KEVIN_JIMENEZ,M,25-Dec-83,CAZON,LBRADFORD@HOTMAIL.COM +1562,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,02-Jan-21,MICHAEL_GIBBS,M,12-May-38,AGUADA_GRANDE,KENNETHWEST@GMAIL.COM +1563,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,03-Jan-21,RICHARD_GRIFFIN,M,16-May-85,ISLA_TIGRE,CLINTONTHOMAS@YAHOO.COM +1564,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,03-Jan-21,AMANDA_GARCIA,F,16-Dec-60,BARRIO_LA_UNION,LORI54@GMAIL.COM +1565,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,03-Jan-21,JONATHAN_HERRERA,M,07-Jun-22,BAJO_GRANDE,NATALIE43@YAHOO.COM +1566,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,03-Jan-21,JAMES_ACEVEDO,M,11-Nov-82,ALISOS__DE_ABAJO,CURRYKRISTINA@HOTMAIL.COM +1567,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,03-Jan-21,JULIE_MCDANIEL,F,17-Nov-90,ARROYO_HONDO,BENJAMIN37@HOTMAIL.COM +1568,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,03-Jan-21,RANDALL_ROBINSON,M,13-May-01,ANGOSTURA,CRYSTALVELASQUEZ@GMAIL.COM +1569,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,03-Jan-21,SIERRA_BAUER,F,09-Dec-15,CAPILLA_GUADALUPE_NORTE,ORTEGAMICHAEL@YAHOO.COM +1570,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,03-Jan-21,ERIKA_PARKER,F,09-Dec-19,GONZALEZ_MORENO,REYESSARA@HOTMAIL.COM +1571,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,03-Jan-21,CRYSTAL_BENNETT,F,06-Oct-72,ALMIRANTE_IRIZAR,MOLLYPORTER@HOTMAIL.COM +1572,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,03-Jan-21,ROBERT_BUCHANAN,M,11-Jul-67,AVENA,LAURA48@GMAIL.COM 
+1573,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,03-Jan-21,MR._GREGORY_MAXWELL,M,27-Oct-12,LA_TRANCA,DANIELREYNOLDS@HOTMAIL.COM +1574,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,04-Jan-21,KELLY_MARTIN,F,03-Oct-06,EL_REMANSO,BETH74@YAHOO.COM +1575,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,04-Jan-21,LUCAS_WEBSTER,M,28-May-28,CAPITAN_CASTRO,CRISTIAN06@HOTMAIL.COM +1576,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,04-Jan-21,BRIAN_SANDERS,M,07-Mar-21,LARRECHEA,TIFFANY12@YAHOO.COM +1577,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,04-Jan-21,MARVIN_MEDINA,M,20-Apr-09,PILAR,SHEILAPUGH@GMAIL.COM +1578,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,04-Jan-21,STEPHEN_WAGNER,M,29-Apr-65,BARRIO_EL_TONTAL,SEAN72@GMAIL.COM +1579,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,04-Jan-21,CHARLES_VEGA,M,17-Jan-36,CHOCORI,JEANNE36@HOTMAIL.COM +1580,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,04-Jan-21,JEREMY_CAMPBELL,M,28-Jul-55,CAMPO_CLUCELLAS,JESSICA22@HOTMAIL.COM +1581,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,04-Jan-21,AMY_SMITH,F,27-Jul-62,COLONIA_PUJOL,IJOHNSON@GMAIL.COM +1582,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,04-Jan-21,RICHARD_BROOKS,M,03-Oct-43,ARANA,LESLIECHANDLER@YAHOO.COM +1583,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,04-Jan-21,KIRSTEN_FERGUSON,F,06-Aug-08,CESPEDES,CHRISTOPHERHALL@HOTMAIL.COM +1584,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,04-Jan-21,ERIC_GREENE,M,29-Jun-33,CLAYPOLE,JANICEROBERTSON@GMAIL.COM +1585,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,04-Jan-21,ROBERT_DEAN,M,09-Jun-72,ESTRADA,RONALD73@GMAIL.COM +1586,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,04-Jan-21,VICKI_HAWKINS,F,16-Sep-82,ESTACION_SAGUIER,KELSEYPERRY@GMAIL.COM +1587,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,04-Jan-21,WILLIAM_MOORE,M,26-May-30,AMERICA,VHOLMES@YAHOO.COM 
+1588,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,04-Jan-21,LISA_HAYES,F,04-Jun-47,COLONIA_CUNCI,JGRAHAM@HOTMAIL.COM +1589,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,04-Jan-21,PATRICK_HARPER,M,05-Aug-73,COLONIA_DURAN,YBOND@HOTMAIL.COM +1590,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,04-Jan-21,DONALD_BARTON,M,16-Jun-28,SAN_ISIDRO,CAMERON82@GMAIL.COM +1591,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,04-Jan-21,LAURA_REESE,F,09-May-19,INGENIERO_ADOLFO_SOURDEAUX,DOMINIQUE68@HOTMAIL.COM +1592,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,04-Jan-21,KIMBERLY_WILLIAMS,F,03-Jun-35,ARROYO_SECO,HEATHER24@HOTMAIL.COM +1593,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,04-Jan-21,BROOKE_LEE,F,14-Oct-93,ANGEL_GALLARDO,ZJONES@YAHOO.COM +1594,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,04-Jan-21,ROBERT_GONZALEZ,M,29-Mar-15,ALGARROBO,JOSE28@GMAIL.COM +1595,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,05-Jan-21,MARISSA_WHITE,F,28-Jul-92,PASO_DE_LOS_ANDES,NICHOLASLANE@YAHOO.COM +1596,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,05-Jan-21,KEVIN_SANCHEZ,M,09-Nov-11,GAHAN,NOAHDUNN@YAHOO.COM +1597,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,05-Jan-21,SHELBY_JOHNSON,F,15-Apr-46,ANZOATEGUI,GEOFFREYFLEMING@GMAIL.COM +1598,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,05-Jan-21,NANCY_DANIELS,F,27-Feb-11,CAÑADA_DE_LAS_OVEJAS,PHYLLIS56@GMAIL.COM +1599,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,05-Jan-21,LARRY_WANG,M,06-Sep-55,LA_ISABEL,SHUNT@YAHOO.COM +1600,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,05-Jan-21,TERRY_OSBORN,M,19-Dec-72,ALMACEN_CASTRO,ZROWE@HOTMAIL.COM +1601,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,05-Jan-21,TERRY_AGUILAR,F,02-Mar-34,LA_EDUVIGIS,BMCGUIRE@YAHOO.COM +1602,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,05-Jan-21,STEPHEN_NICHOLSON,M,12-Sep-36,EL_TALA,WILKINSONEBONY@GMAIL.COM 
+1603,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,05-Jan-21,CRYSTAL_BAXTER,F,17-Sep-52,ARROYO_PASTORA,YOUNGKEVIN@HOTMAIL.COM +1604,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,05-Jan-21,RYAN_LEWIS,M,27-Nov-64,ALDEA_SANTA_MARIA,KKENT@GMAIL.COM +1605,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,05-Jan-21,SYLVIA_PROCTOR,F,13-Sep-18,BAHIA_SAN_BLAS,QBELL@YAHOO.COM +1606,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,05-Jan-21,TERRY_STEWART,F,24-Nov-83,ALGARROBO_DEL_AGUILA,MICHAEL23@GMAIL.COM +1607,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,05-Jan-21,ASHLEY_ORR,F,19-Nov-81,LOMAS_DEL_MIRADOR,TYLER04@HOTMAIL.COM +1608,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,06-Jan-21,CAROLYN_WONG,F,21-Jul-80,AGUAS_BUENAS,EEATON@YAHOO.COM +1609,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,06-Jan-21,LAURA_JONES,F,16-May-89,RINCON_DE_MILBERG,DONALD97@HOTMAIL.COM +1610,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,06-Jan-21,RYAN_ACOSTA,M,27-Apr-36,LUIS_CHICO,MADISONWOODS@GMAIL.COM +1611,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,06-Jan-21,DAVID_COLLINS,M,04-Jul-00,BERISSO,PAMELABENJAMIN@GMAIL.COM +1612,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,06-Jan-21,DONNA_MORENO,F,05-Jul-55,CARLOS_KEEN,UPITTMAN@YAHOO.COM +1613,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,06-Jan-21,DEVIN_LEWIS,M,15-Jul-27,EMPALME_FRONTERA,MARGARET60@GMAIL.COM +1614,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,06-Jan-21,CRYSTAL_BOWMAN,F,06-Mar-26,AGUA_DE_CASTILLA,JONATHAN51@GMAIL.COM +1615,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,06-Jan-21,NICOLE_WARE,F,08-Aug-22,NELSON,CWILLIAMS@HOTMAIL.COM +1616,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,06-Jan-21,SCOTT_MITCHELL,M,17-Jun-93,CASTILLA,NATALIESTEVENSON@HOTMAIL.COM +1617,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,06-Jan-21,TAMMY_WIGGINS,F,17-Dec-86,CHAPANAY,SARAHWILSON@YAHOO.COM 
+1618,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,06-Jan-21,JENNIFER_CLARK,F,08-Apr-13,JESUS_MARIA,JOHN42@GMAIL.COM +1619,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,06-Jan-21,NICHOLE_FLORES,F,07-Jun-11,COLONIA_LOS_SAUCES,COLLINSSTEPHEN@GMAIL.COM +1620,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,06-Jan-21,ERIKA_HOWARD,F,27-Feb-19,CHAVARRIA,BUTLERANN@YAHOO.COM +1621,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,07-Jan-21,MR._BRIAN_JONES,M,30-May-01,ACARAGUA,LOPEZTONI@HOTMAIL.COM +1622,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,07-Jan-21,KELLY_YOUNG,F,23-Jun-00,ARROYO_SALADO,RODGERSCHRISTOPHER@YAHOO.COM +1623,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,07-Jan-21,SAMANTHA_SHARP,F,23-Aug-65,25_DE_MAYO,VARGASERICA@GMAIL.COM +1624,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,07-Jan-21,KATHRYN_BATES,F,25-Oct-04,ESTANCIAS,MILLERNICOLE@YAHOO.COM +1625,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,07-Jan-21,DEBORAH_KING,F,02-Jul-16,LAGUNA_DEL_BARRO,YCAMPOS@GMAIL.COM +1626,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,07-Jan-21,ANDREA_TORRES,F,06-Apr-07,FRANCISCO_ALVAREZ,ROBERTSMITH@YAHOO.COM +1627,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,07-Jan-21,SANDRA_PALMER,F,21-Jun-15,GREGORIO_DE_LAFERRERE,DAVIDBENTLEY@HOTMAIL.COM +1628,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,07-Jan-21,JEREMY_LOWE,M,19-Aug-30,ABRA_PAMPA,GARRISONPENNY@YAHOO.COM +1629,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,07-Jan-21,KELLY_COHEN,F,27-Feb-72,LA_CALIFORNIA,DAWN60@GMAIL.COM +1630,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,07-Jan-21,TERRY_MONROE,M,20-Mar-17,ACOSTILLA,SIMSCAROLYN@GMAIL.COM +1631,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,07-Jan-21,DANIEL_BRYANT,M,14-Feb-29,BAJO_HONDO,BONNIEWHITNEY@YAHOO.COM 
+1632,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,07-Jan-21,MELISSA_YOUNG,F,16-May-02,AZOPARDO,JAREDROBLES@HOTMAIL.COM +1633,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,07-Jan-21,MICHAEL_PEREZ,M,18-Feb-36,JUAN_E_BARRA,SMITHMICHELLE@HOTMAIL.COM +1634,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,07-Jan-21,PATRICIA_GROSS,F,31-Jul-16,COSTA_DEL_NOGOYA,LISASHEPHERD@GMAIL.COM +1635,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,08-Jan-21,NATASHA_CHAN,F,23-Aug-61,11_DE_MAYO,SWOOD@GMAIL.COM +1636,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,08-Jan-21,KAREN_WOODWARD_DDS,F,20-May-11,ALEGRIA,RANDALLCASEY@HOTMAIL.COM +1637,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,08-Jan-21,MARK_HILL,M,07-Mar-77,BLAQUIER,HJORDAN@GMAIL.COM +1638,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,08-Jan-21,LINDA_ANDERSON,F,20-May-49,COLIQUEO,JENNIFER80@YAHOO.COM +1639,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,08-Jan-21,SIERRA_CASEY,F,24-Oct-98,ARMINDA,WALLERPATRICK@GMAIL.COM +1640,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,08-Jan-21,LINDA_GOODWIN,F,08-Nov-57,PIAMONTE,DIXONCHRISTINA@YAHOO.COM +1641,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,08-Jan-21,MERCEDES_WILLIAMS,F,30-Apr-96,LOTE_11_ESCUELA_107,RYATES@HOTMAIL.COM +1642,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,08-Jan-21,SARAH_LARSON,F,15-Aug-26,BARRIO_LENCINA,PETERSONJANET@GMAIL.COM +1643,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,08-Jan-21,CLAUDIA_SULLIVAN,F,24-Oct-35,MONTE_CHINGOLO,PLAMBERT@HOTMAIL.COM +1644,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,08-Jan-21,JACK_RYAN,M,12-Nov-68,LAVALLE,WOODMELVIN@YAHOO.COM +1645,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,08-Jan-21,ROBERT_DAVIS,M,09-Jun-11,AVANZADA,NLAWSON@GMAIL.COM +1646,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,08-Jan-21,SCOTT_LEWIS,M,27-Feb-65,ESTACION_LAGO_EPECUEN,BROWNMARY@HOTMAIL.COM 
+1647,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,08-Jan-21,LISA_RIVERA,F,18-Aug-41,VILLA_EL_CHOCON,DANIEL42@GMAIL.COM +1648,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,08-Jan-21,ANTHONY_WALL,M,04-Dec-54,ALTO_VERDE,JOHNSONMARVIN@YAHOO.COM +1649,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,09-Jan-21,NICHOLAS_CISNEROS,M,27-Dec-99,EL_ZAPALLAR,RODNEYCOOLEY@HOTMAIL.COM +1650,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,09-Jan-21,ALEX_SIMPSON,M,21-Dec-20,BUEN_PASTO,LEONARD70@YAHOO.COM +1651,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,09-Jan-21,AUSTIN_KLINE_DVM,M,05-Jun-40,CORTADERAS,DUNCANJEFFREY@HOTMAIL.COM +1652,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,09-Jan-21,ELIZABETH_STONE,F,15-Apr-06,CUARTEL_V,NVILLANUEVA@HOTMAIL.COM +1653,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,09-Jan-21,SARAH_WEBB,F,04-Nov-72,ARROYO_BALMACEDA,JEFFREYROGERS@YAHOO.COM +1654,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,09-Jan-21,JERRY_EDWARDS,M,23-Aug-67,APARICIO_CUE,JSIMMONS@GMAIL.COM +1655,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,09-Jan-21,JULIE_ROSE,F,04-Mar-93,VILLANI,VFOX@HOTMAIL.COM +1656,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,09-Jan-21,LEAH_MORENO,F,04-Feb-30,KILOMETRO_125,SJONES@GMAIL.COM +1657,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,09-Jan-21,KENNETH_RODGERS,M,04-Jan-94,ESTACION_MORENO,SEANHUNTER@HOTMAIL.COM +1658,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,10-Jan-21,TAYLOR_HARMON,F,22-Aug-11,HARAS_SAN_JACINTO,HENDRICKSGARY@GMAIL.COM +1659,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,10-Jan-21,BETH_ANDERSON,F,17-Nov-33,BUEN_RETIRO,WEAVERMAUREEN@GMAIL.COM +1660,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,10-Jan-21,VALERIE_SWANSON,F,13-Oct-20,EL_JUPITER,KIMBERLY05@HOTMAIL.COM +1661,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,10-Jan-21,EVELYN_WOODS,F,22-Jun-97,ALGARROBAL,PJOHNSON@YAHOO.COM 
+1662,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,10-Jan-21,TYLER_WALKER,M,11-Feb-11,KILOMETRO_125,KELLIRIVERA@GMAIL.COM +1663,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,10-Jan-21,DOUGLAS_NGUYEN,M,05-Jul-31,ACEILAN,VALERIE00@HOTMAIL.COM +1664,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,10-Jan-21,ELIZABETH_YATES,F,28-Apr-61,AGUADITA,STEVENTHOMAS@GMAIL.COM +1665,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,11-Jan-21,JORDAN_STEIN,F,25-May-39,BARRIO_LA_UNION,XROBERTS@YAHOO.COM +1666,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,11-Jan-21,PATRICIA_BENNETT,F,06-Sep-21,FRANCISCO_CASAL,KAREN85@GMAIL.COM +1667,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,11-Jan-21,TRAVIS_KELLEY,M,15-May-23,COLIQUEO,MICHAEL43@HOTMAIL.COM +1668,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,11-Jan-21,RICHARD_KING,M,03-Mar-83,ALISOS__DE_ABAJO,HKOCH@YAHOO.COM +1669,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,11-Jan-21,LYNN_LARSON,F,20-Jun-60,GENTE_GRANDE,KATHERINE10@YAHOO.COM +1670,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,11-Jan-21,JOHN_MUNOZ,M,09-Oct-51,9_DE_JULIO,ARTHUR66@GMAIL.COM +1671,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,11-Jan-21,DALE_ACOSTA,M,28-Jun-35,ADRIAN_MATURANO,KENNEDYAPRIL@YAHOO.COM +1672,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,11-Jan-21,JONATHAN_MCCLURE,M,19-Oct-55,ACEILAN,RAYMONDDAVENPORT@GMAIL.COM +1673,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,11-Jan-21,ANNA_BRAY,F,23-Feb-44,ALMA_GRANDE,BOWMANSTEPHANIE@HOTMAIL.COM +1674,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,11-Jan-21,JAMIE_PALMER,F,04-Sep-82,CURANDU,AMY18@GMAIL.COM +1675,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,11-Jan-21,JANET_BURKE,F,21-Aug-15,ALASTUEY,BROWNCRYSTAL@GMAIL.COM +1676,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,11-Jan-21,HEIDI_WOOD,F,10-Feb-12,EL_CENIZO,HOLSEN@HOTMAIL.COM +1677,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,12-Jan-21,DEBORAH_BARRY,F,27-Mar-35,CAMPO_SABATE,EHUNT@HOTMAIL.COM 
+1678,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,12-Jan-21,TONY_FIGUEROA,M,16-Dec-11,TEMPERLEY,MICHELEWILLIAMS@GMAIL.COM +1679,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,12-Jan-21,CONNOR_MYERS,M,21-Nov-40,CABRED,CHRISTOPHERGONZALEZ@YAHOO.COM +1680,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,12-Jan-21,VALERIE_ROBINSON,F,15-Jan-77,ALCARAZ_NORTE,MATTHEWRAMIREZ@YAHOO.COM +1681,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,12-Jan-21,KIMBERLY_ALLEN,F,26-Feb-58,BASAIL,ANGELA43@YAHOO.COM +1682,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,12-Jan-21,MONICA_GOODWIN,F,03-Jun-17,PASO_DE_LOS_ANDES,GARROYO@YAHOO.COM +1683,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,12-Jan-21,DANIEL_CAMPBELL,M,11-May-09,LAVALLE,MARTIN19@GMAIL.COM +1684,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,12-Jan-21,PAUL_COX,M,18-Jan-48,ANTONIO_CARBONI,DAVID15@YAHOO.COM +1685,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,12-Jan-21,MACKENZIE_WILLIAMS,F,20-Jul-47,EL_RETIRO,NHAMPTON@GMAIL.COM +1686,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,12-Jan-21,JULIE_CARTER,F,28-Apr-20,LAS_PALMAS,ANDREWAGNER@YAHOO.COM +1687,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,12-Jan-21,DR._DONNA_DAVID_DVM,F,30-Jan-10,COLONIA_LOS_ZAPALLOS,JACOB43@HOTMAIL.COM +1688,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,13-Jan-21,WILLIAM_SMITH,M,09-Apr-20,BAÑADO_NORTE,FARRELLNATASHA@GMAIL.COM +1689,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,13-Jan-21,ERIC_TODD,M,28-Jul-43,ALGARROBO,JOHN50@HOTMAIL.COM +1690,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,13-Jan-21,HOLLY_RYAN,F,19-Dec-98,FRANCISCO_MADERO,POTTSEMMA@GMAIL.COM +1691,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,13-Jan-21,JENNIFER_HALE,F,20-Jul-38,AROMOS,KATHERINECAREY@YAHOO.COM +1692,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,13-Jan-21,STEVEN_SMITH,M,23-May-16,25_DE_MAYO,JASON52@GMAIL.COM 
+1693,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,13-Jan-21,MR._JEREMY_DUNLAP,M,17-Mar-19,CASCADA,ASHLEY15@GMAIL.COM +1694,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,13-Jan-21,JOHN_PATTERSON,M,21-Oct-80,COLONIA_AROCENA_INA,THOMASSCOTT@HOTMAIL.COM +1695,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,13-Jan-21,TIMOTHY_BROWN,M,13-Apr-99,SAN_MAYOL,REEDKIMBERLY@YAHOO.COM +1696,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,13-Jan-21,TROY_WALLACE,M,11-Jul-98,BUENA_VISTA,SALAZARJAMES@GMAIL.COM +1697,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,14-Jan-21,BETTY_BELL,F,25-Jan-11,LA_PASTORA,ANDREW40@HOTMAIL.COM +1698,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,14-Jan-21,ANDREW_MONTGOMERY,M,03-Jan-05,COSTA_BRAVA,KELLY23@HOTMAIL.COM +1699,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,14-Jan-21,NATHAN_PAYNE,M,10-Jun-40,ALTO_VERDE,MICHAELSMITH@YAHOO.COM +1700,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,14-Jan-21,DIANE_PIERCE,F,23-Feb-65,INGENIERO_ADOLFO_SOURDEAUX,MELISSA63@YAHOO.COM +1701,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,14-Jan-21,BRIAN_PADILLA,M,26-Mar-55,CAMPO_CARETTO,GINA16@HOTMAIL.COM +1702,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,14-Jan-21,KIMBERLY_GOLDEN,F,06-Jun-30,ARROYO_MANGANGA,JAMESBRADSHAW@YAHOO.COM +1703,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,14-Jan-21,JOHN_WARD,M,09-Dec-62,AVESTRUZ,CHADWILLIAMS@GMAIL.COM +1704,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,14-Jan-21,ROBERT_WASHINGTON_JR.,M,19-Jul-78,CRISTOLIA,MELISSAPHILLIPS@GMAIL.COM +1705,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,14-Jan-21,REGINA_MUNOZ,F,07-Nov-18,ALDEA_CHALECO,SARAHMAXWELL@HOTMAIL.COM +1706,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,14-Jan-21,GREGORY_LUNA,M,03-Dec-66,PIAMONTE,JASON78@HOTMAIL.COM +1707,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,14-Jan-21,STEPHANIE_ROSE,F,27-Jun-98,COSTA_BRAVA,MICHAEL72@YAHOO.COM 
+1708,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,14-Jan-21,SARAH_GONZALES,F,17-Apr-11,BARCENA,FIGUEROARICHARD@YAHOO.COM +1709,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,14-Jan-21,ROBERT_LUCAS,M,26-Jul-65,BARCENA,JAMES05@YAHOO.COM +1710,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,15-Jan-21,DAVID_HARRINGTON,M,15-Jul-08,INGENIERO_THOMPSON,ALEXANDERDAVID@HOTMAIL.COM +1711,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,15-Jan-21,JOSEPH_SMITH,M,11-Sep-34,COLONIA_HERNANDARIAS,BRAYCHERYL@HOTMAIL.COM +1712,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,15-Jan-21,NATALIE_BAXTER,F,03-Aug-59,BUENA_ESPERANZA,FREDERICK05@GMAIL.COM +1713,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,15-Jan-21,DONNA_MORRISON,F,03-Dec-42,CATAMONTAÑA,DENNIS36@HOTMAIL.COM +1714,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,15-Jan-21,SYDNEY_PRICE,F,12-Jun-36,PELLEGRINI,SINGLETONJOSHUA@YAHOO.COM +1715,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,15-Jan-21,CHRISTY_BURKE,F,20-Oct-42,ABO_NEZU,VALERIE17@GMAIL.COM +1716,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,15-Jan-21,NANCY_WARD_MD,F,22-Nov-30,GENERAL_RODRIGUEZ,EDWARDCOOPER@HOTMAIL.COM +1717,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,15-Jan-21,SUSAN_JOHNSON,F,06-May-83,CIPOLLETTI,MKRAMER@GMAIL.COM +1718,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,15-Jan-21,KEVIN_HOLT,M,07-Dec-38,JUAN_F_IBARRA,MSCHMIDT@HOTMAIL.COM +1719,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,15-Jan-21,MATTHEW_LEWIS,M,09-Aug-53,LOS_FRENTONES,MALIK58@GMAIL.COM +1720,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,15-Jan-21,ERICA_CHANG,F,08-Jan-15,BALSA_SENILLOSA,MICHAELSHIELDS@YAHOO.COM +1721,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,16-Jan-21,RACHEL_HUGHES,F,19-Dec-88,OCHO_VADOS,ADRIAN35@GMAIL.COM +1722,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,16-Jan-21,TIMOTHY_WARREN,M,19-Feb-19,LA_FLORENCIA,JOHNSONSHEENA@YAHOO.COM 
+1723,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,16-Jan-21,JAMES_ANDERSON,M,15-Nov-24,VILLA_SANTOS_TESEI,KAREN32@HOTMAIL.COM +1724,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,16-Jan-21,BRITTANY_GRIFFIN,F,25-Jun-89,SAN_GENARO_NORTE,JOHNARIAS@HOTMAIL.COM +1725,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,16-Jan-21,JOSEPH_NOVAK,M,29-Oct-54,ARROYO_ALELI,RYAN08@HOTMAIL.COM +1726,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,16-Jan-21,SARAH_YOUNG,F,05-Mar-06,AGUA_RICA,RWHITE@GMAIL.COM +1727,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,16-Jan-21,RACHEL_HARRIS,F,08-Oct-09,MAIPU,MCCARTHYFERNANDO@YAHOO.COM +1728,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,16-Jan-21,JEFFREY_FOSTER,M,16-Jan-93,ADAN_QUIROGA,UBENNETT@GMAIL.COM +1729,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,16-Jan-21,TROY_ROGERS,M,14-Nov-08,LA_TRANCA,RONALD06@GMAIL.COM +1730,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,16-Jan-21,MARCUS_HOLLAND,M,04-Jan-13,ARAUJO,WALKERSCOTT@HOTMAIL.COM +1731,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,16-Jan-21,WENDY_JENSEN,F,18-Dec-26,IRENEO_PORTELA,BECKY66@HOTMAIL.COM +1732,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,16-Jan-21,REBECCA_PUGH,F,10-Aug-03,B_LOS_AROMOS_SAN_PATRICIO,ALISHAENGLISH@YAHOO.COM +1733,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,16-Jan-21,KATHERINE_LANE,F,30-Apr-33,COLONIA_LA_INDIA,BRANGEL@GMAIL.COM +1734,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,17-Jan-21,MARK_MCCOY,M,02-Oct-17,BERDUC,SNYDERSARA@YAHOO.COM +1735,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,17-Jan-21,KRYSTAL_RODRIGUEZ,F,04-Feb-06,PORVENIR,HHALL@GMAIL.COM +1736,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,17-Jan-21,GINA_LEE,F,03-Oct-14,BARRA_BONITA,KARENROBERSON@GMAIL.COM +1737,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,17-Jan-21,KRISTY_COOPER,F,13-Apr-45,LOMAS_DEL_MIRADOR,KEVIN16@YAHOO.COM 
+1738,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,17-Jan-21,ANGELA_DAVIS,F,02-Dec-65,LONGCHAMPS,PHILLIP46@GMAIL.COM +1739,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,17-Jan-21,REBECCA_NIELSEN,F,12-Jul-10,ALIJILAN,OLIVIAREYNOLDS@HOTMAIL.COM +1740,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,17-Jan-21,PAUL_GRAHAM,M,01-Nov-91,CABRERIA,GREGORY66@GMAIL.COM +1741,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,17-Jan-21,KATHERINE_NELSON,F,01-Aug-97,BARRIO_BELGRANO,YCLAYTON@HOTMAIL.COM +1742,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,17-Jan-21,KEVIN_ROBINSON,M,18-Jun-24,CAMPO_GARAY,GONZALESELIZABETH@YAHOO.COM +1743,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,17-Jan-21,STEVEN_WILKINSON,M,18-May-66,CARLOS_SALAS,UANDERSON@GMAIL.COM +1744,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,17-Jan-21,MARGARET_VILLANUEVA,F,19-Jun-20,BAHIA_CREEK,RAVEN83@YAHOO.COM +1745,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,18-Jan-21,CYNTHIA_WILLIAMS,F,31-Oct-35,ANJULLON,JOHNSONTRAVIS@GMAIL.COM +1746,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,18-Jan-21,MARTHA_BROWN,F,09-Aug-78,ALPACHIRI,HMCGEE@GMAIL.COM +1747,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,18-Jan-21,JAMES_WHITAKER,M,16-Jul-68,CAMET,GREENJUAN@HOTMAIL.COM +1748,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,18-Jan-21,NICOLE_WILLIAMS,F,10-Dec-64,ARROYO_LAS_MINAS,LISACANTU@HOTMAIL.COM +1749,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,18-Jan-21,DUSTIN_STEWART,M,26-Jul-22,COLONIA_ALBERDI,SIMMONSEILEEN@HOTMAIL.COM +1750,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,18-Jan-21,SUSAN_JOHNSON,F,21-Apr-58,BONPLAND_NORTE,BROWNJAKE@GMAIL.COM +1751,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,18-Jan-21,GARY_CHANG,M,24-Feb-08,BOLIVAR,REGINA51@YAHOO.COM +1752,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,18-Jan-21,GREGORY_ADAMS,M,01-Feb-74,BARCENA,AWILLIAMS@GMAIL.COM 
+1753,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,19-Jan-21,MARK_GRIFFIN,M,20-May-75,LA_LEGUA,MCBRIDEREBECCA@YAHOO.COM +1754,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,19-Jan-21,NICHOLAS_JOHNSTON,M,29-May-29,RAMOS_MEJIA,BRANDONBURTON@HOTMAIL.COM +1755,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,19-Jan-21,ZACHARY_JENKINS,M,03-Aug-47,EL_ESPINILLO,BATESNORMA@GMAIL.COM +1756,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,19-Jan-21,KATHRYN_CLARK,F,16-Nov-15,ALMIRANTE_IRIZAR,HOLLY98@HOTMAIL.COM +1757,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,19-Jan-21,PATRICK_HILL,M,29-Jan-71,ALTAMIRA,JACOB66@GMAIL.COM +1758,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,19-Jan-21,CHAD_GARCIA,M,30-Sep-05,ZONA_DELTA_TIGRE,OMILLER@HOTMAIL.COM +1759,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,19-Jan-21,MEGAN_BRADLEY,F,13-Jun-91,BARCALA,DESTINY55@YAHOO.COM +1760,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,19-Jan-21,KRISTEN_JOHNSON,F,23-Oct-54,HUANQUEROS,FITZPATRICKERIC@GMAIL.COM +1761,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,19-Jan-21,MELISSA_ROMERO,F,21-Jan-98,EL_CIPRES,NICHOLASCHANDLER@GMAIL.COM +1762,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,19-Jan-21,RENEE_PATRICK,F,08-Sep-09,AVIA_TERAI,WILLIAMGAY@YAHOO.COM +1763,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,20-Jan-21,STEPHEN_TAYLOR,M,31-Jan-08,BALNEARIO_OCEANO,WENDYLONG@HOTMAIL.COM +1764,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,20-Jan-21,KIMBERLY_DAVENPORT,F,07-Dec-05,CERRO_SANTA_ANA,MCLAUGHLINCINDY@GMAIL.COM +1765,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,20-Jan-21,DERRICK_HAMMOND,M,15-Oct-51,CHOLILA,JAMIETANNER@HOTMAIL.COM +1766,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,20-Jan-21,STACEY_DURAN,F,11-Apr-97,CAMPO_UBAJO,GREENESTEVEN@HOTMAIL.COM +1767,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,20-Jan-21,CARL_KRAMER,M,19-Nov-51,AMBROSETTI,KRISTOPHER60@GMAIL.COM 
+1768,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,20-Jan-21,SANDY_BELTRAN,F,08-May-81,IRAOLA,MURPHYJENNIFER@GMAIL.COM +1769,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,20-Jan-21,CHELSEA_SMITH,F,28-Oct-08,TABLADA,NICOLEWALLACE@HOTMAIL.COM +1770,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,20-Jan-21,SHERYL_HEATH,F,02-Sep-14,ACASSUSO,IRUIZ@YAHOO.COM +1771,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,20-Jan-21,HEIDI_GARCIA,F,28-Jul-78,PUENTE_DEL_INCA,LORIHOLMES@YAHOO.COM +1772,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,20-Jan-21,WILLIAM_TAYLOR,M,17-Jun-60,CORONEL_BOERR,WHITEDANIELLE@YAHOO.COM +1773,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,20-Jan-21,LANCE_DYER,M,28-Feb-66,CLAVERIE,DUANEMARQUEZ@GMAIL.COM +1774,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,20-Jan-21,TODD_COHEN,M,30-Oct-29,CLAVERIE,JOHN29@HOTMAIL.COM +1775,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,20-Jan-21,MEGAN_PRICE,F,10-Dec-09,CAPDEPONT,GABRIEL10@HOTMAIL.COM +1776,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,20-Jan-21,BAILEY_CALDWELL,F,11-Dec-31,BAHIA_SAN_BLAS,ALLENKARA@GMAIL.COM +1777,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,21-Jan-21,GARY_KENNEDY,M,15-Apr-42,AGUADA_A_PIQUE,UMARQUEZ@YAHOO.COM +1778,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,21-Jan-21,SHANNON_SKINNER,F,30-Mar-30,20_DE_JUNIO,GARRETTMOORE@GMAIL.COM +1779,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,21-Jan-21,RICHARD_INGRAM,M,23-Oct-11,CARLOS_KEEN,MORTONSARAH@GMAIL.COM +1780,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,21-Jan-21,LINDA_BROWN,F,27-Jul-21,ARQUEDAS,VBAILEY@YAHOO.COM +1781,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,21-Jan-21,MEGAN_HERRERA,F,04-Jul-68,LLAVALLOL,ZCHAPMAN@HOTMAIL.COM +1782,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,21-Jan-21,ANDREA_GOODMAN,F,18-Apr-14,ESTANCIA_SANTA_CATALINA,NICOLEMCKAY@GMAIL.COM 
+1783,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,21-Jan-21,STEPHEN_CHARLES,M,16-Jan-49,AMPACAMA,TANDERSON@YAHOO.COM +1784,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,21-Jan-21,CAROL_ROBERSON,F,12-Dec-16,HUANQUEROS,ORANGEL@YAHOO.COM +1785,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,21-Jan-21,JUAN_BURGESS,M,14-Jan-12,9_DE_JULIO_KILOMETRO_20,RACHELLEWIS@YAHOO.COM +1786,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,21-Jan-21,MICHELLE_MILLER,F,11-Sep-07,ANTIGUO,SHAYES@YAHOO.COM +1787,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,21-Jan-21,JUSTIN_HARRIS,M,30-Jul-73,ALDEA_BRASILERA,WOODSBRIAN@GMAIL.COM +1788,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,21-Jan-21,ERIC_HARRINGTON,M,06-Aug-84,ESTANCIA_LAS_GAMAS,STEVENMCMILLAN@HOTMAIL.COM +1789,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,21-Jan-21,TANNER_MCCULLOUGH,M,19-Dec-17,CABURE,LISA28@YAHOO.COM +1790,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,22-Jan-21,MARIAH_DEAN,F,26-Oct-60,BERAZATEGUI,ZSWANSON@HOTMAIL.COM +1791,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_TERAPIA_OCUPACIONAL,22-Jan-21,CHRISTOPHER_BROWN,M,19-Nov-70,VALLE_HONDO,CLONG@HOTMAIL.COM +1792,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,22-Jan-21,PETER_BATES,M,11-Apr-39,AGUA_DE_DIONISIO,CARPENTERCARL@HOTMAIL.COM +1793,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,22-Jan-21,ANITA_ROWE,F,21-Apr-68,ALCORTA,MICHAELFIELDS@GMAIL.COM +1794,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,22-Jan-21,SARAH_JONES,F,03-Jun-29,DESPEÑADEROS,DANIELMILLER@YAHOO.COM +1795,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,22-Jan-21,JENNIFER_BONILLA,F,11-Mar-00,LA_COLINA,COXTIMOTHY@YAHOO.COM +1796,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,22-Jan-21,MELISSA_WARD,F,18-Aug-45,BAJO_CARACOLES,ERIK45@HOTMAIL.COM +1797,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,22-Jan-21,KIM_CARLSON,F,16-Dec-01,VILLA_NUMANCIA,TONYJACKSON@HOTMAIL.COM 
+1798,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,23-Jan-21,TAMMY_RIOS,F,16-Jul-44,BENAVIDEZ,HSHORT@HOTMAIL.COM +1799,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,23-Jan-21,JAMES_BROWN,M,22-Oct-11,CAMPO_CRENNA,BRANDON33@GMAIL.COM +1800,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,23-Jan-21,SEAN_GRIMES,M,15-Aug-81,11_DE_MAYO,JASMINEHALL@HOTMAIL.COM +1801,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,23-Jan-21,ANGELA_MYERS,F,28-Jun-66,ARROYO_MOREIRA,ALEXANDERHINTON@HOTMAIL.COM +1802,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,23-Jan-21,CHERYL_CAIN,F,26-Sep-06,ALTO_RIO_PICO,BELLCAITLIN@YAHOO.COM +1803,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,23-Jan-21,AMY_COPELAND,F,28-Jan-05,COLONIA_HARDY,JEREMYPOTTER@HOTMAIL.COM +1804,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,23-Jan-21,JOSEPH_BENNETT,M,12-Oct-96,ARROYO_DEL_PESCADO,JOHN96@HOTMAIL.COM +1805,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,23-Jan-21,MARK_RANDALL,M,20-Sep-87,CAMPAMENTO_SOL,DEBBIESIMPSON@HOTMAIL.COM +1806,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,23-Jan-21,WILLIAM_ELLIOTT,M,09-Dec-38,ANCON,RSUTTON@GMAIL.COM +1807,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,23-Jan-21,AMY_SMITH,F,18-Aug-83,CERRO_ACONCAGUA,ANDREW80@GMAIL.COM +1808,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,23-Jan-21,BRIAN_PEARSON,M,01-Aug-84,CENTRO_AGRICOLA_EL_PATO,OWHITE@GMAIL.COM +1809,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,23-Jan-21,DANIEL_FOX,M,07-Jun-52,ALDEA_SANTA_MARIA,WILLIAM62@GMAIL.COM +1810,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,23-Jan-21,JAMES_REYES,M,15-Jan-34,ARROYO_GRANDE,MICHEALRIOS@GMAIL.COM +1811,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,24-Jan-21,DIANE_WILLIAMS,F,19-Nov-13,CAPITAN_CASTRO,CASSANDRA44@HOTMAIL.COM +1812,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,24-Jan-21,DARRELL_HOLMES,M,13-Apr-47,SANCTI_SPIRITU,UJACKSON@GMAIL.COM 
+1813,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,24-Jan-21,HANNAH_WILLIAMS,F,20-Feb-78,LA_EDUVIGIS,AMBER07@HOTMAIL.COM +1814,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,25-Jan-21,THOMAS_DAVIS,M,26-May-90,HUANGUELEN,CLARKALEXIS@YAHOO.COM +1815,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,25-Jan-21,RUTH_MILLER,F,20-Jun-31,DEL_VISO,SABRINA79@HOTMAIL.COM +1816,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,25-Jan-21,BRENDA_HENRY,F,14-Nov-99,CASTELAR,BOOKERCHRISTOPHER@GMAIL.COM +1817,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,25-Jan-21,BENJAMIN_STUART_MD,M,16-Apr-57,BETBEDER,KATHLEENSANDERS@YAHOO.COM +1818,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,25-Jan-21,CRYSTAL_MONTGOMERY,F,11-Jul-62,BARRO_NEGRO,BJORDAN@GMAIL.COM +1819,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,25-Jan-21,VICTORIA_HIGGINS,F,26-Jul-93,ANTIGUO,WEBSTERBRADLEY@YAHOO.COM +1820,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,25-Jan-21,MICHAEL_HENDERSON,M,15-Jan-57,LOS_CORREDORES,DESIREETUCKER@YAHOO.COM +1821,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,26-Jan-21,CHERYL_JONES,F,20-Sep-21,ANTONIO_TOMAS,HOFFMANSANDRA@HOTMAIL.COM +1822,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,26-Jan-21,REBECCA_PRATT,F,21-Aug-37,AGUARA_GRANDE,STEPHANIEALEXANDER@HOTMAIL.COM +1823,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,26-Jan-21,TAMMY_FOX,F,11-Feb-98,CARAGUATAY,BGENTRY@GMAIL.COM +1824,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,26-Jan-21,DIANE_CLARK_DDS,F,06-Jul-34,ALDEA_ESCOLAR,YDUNCAN@YAHOO.COM +1825,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,26-Jan-21,TRACY_HERRERA,F,03-Dec-77,CACHIRULO,ANDREANELSON@HOTMAIL.COM +1826,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,26-Jan-21,DIANA_DAVENPORT,F,14-Jun-27,WHEELWRIGHT,JOEL88@GMAIL.COM +1827,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Jan-21,RENEE_JUAREZ,F,20-Apr-20,BERAZATEGUI,CWU@HOTMAIL.COM 
+1828,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,26-Jan-21,TRAVIS_RIVERS,M,18-Feb-78,VILLA_ANGELICA,YCASTILLO@YAHOO.COM +1829,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,26-Jan-21,JOSEPH_STOKES,M,03-Jun-29,ARROYO_SALADO,CHARLESCOOK@GMAIL.COM +1830,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,26-Jan-21,CHRISTINE_RIOS,F,07-May-83,LAVALLE,XCHAPMAN@HOTMAIL.COM +1831,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PLANIFICACIÓN_Y_DISEÑO_DEL_PAISAJE,26-Jan-21,LINDA_REYES,F,15-Sep-04,BARROS_PAZOS,MILLERJOHN@HOTMAIL.COM +1832,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,26-Jan-21,MARCUS_REEVES,M,23-May-92,CLAYPOLE,EMMA33@HOTMAIL.COM +1833,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,26-Jan-21,DAVE_BAKER,M,05-Jan-06,EL_CENIZO,NREYES@YAHOO.COM +1834,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,26-Jan-21,KATHLEEN_SMITH,F,03-Jul-21,CORRALITO,COURTNEYSTEWART@GMAIL.COM +1835,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,26-Jan-21,MITCHELL_GONZALEZ,M,03-Nov-75,CAMINERA_LUJAN,JACKSONPATRICIA@GMAIL.COM +1836,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,27-Jan-21,MARK_BURNETT,M,05-Nov-18,ESTACION_SAGUIER,JACKSONKATIE@HOTMAIL.COM +1837,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,27-Jan-21,JESSICA_DAVIS,F,01-Apr-08,COLONIA_RIVAS,BRADLEY05@HOTMAIL.COM +1838,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,27-Jan-21,EMILY_SIMON,F,05-Jul-88,ARBOL_SOLO,XMOORE@HOTMAIL.COM +1839,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,27-Jan-21,JUDITH_MCCLAIN,F,03-Sep-53,25_DE_MAYO,MATAPAUL@YAHOO.COM +1840,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_AMBIENTALES,27-Jan-21,JUSTIN_MARTIN,M,16-Jan-02,COLONIA_LOMA_NEGRA,JERRY11@HOTMAIL.COM +1841,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,27-Jan-21,KIMBERLY_LEVY,F,21-Jan-09,CAÑADON_LEON,XMCCARTY@HOTMAIL.COM +1842,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_EDUCACIÓN_,27-Jan-21,KAYLA_FINLEY,F,07-Dec-44,CAZON,HALEY55@YAHOO.COM 
+1843,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,27-Jan-21,ALEXANDRA_PEREZ,F,04-Jul-01,PLANCHADA_BANDERITA,BELTRANKATHLEEN@GMAIL.COM +1844,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,27-Jan-21,WHITNEY_COWAN,F,19-May-57,CORONEL_BOERR,GPEREZ@YAHOO.COM +1845,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,27-Jan-21,THOMAS_CAMACHO,M,16-Jan-94,COSTA_GRANDE,YBROWN@GMAIL.COM +1846,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,27-Jan-21,BETH_FARRELL,F,11-Jul-04,CAMPO_PEÑA_LOPEZ,WALKERLISA@HOTMAIL.COM +1847,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,27-Jan-21,THOMAS_RODRIGUEZ,M,26-Mar-96,EL_PINGO,WENDY23@HOTMAIL.COM +1848,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,27-Jan-21,LISA_BRIDGES,F,15-Sep-07,CAMERON,TIMOTHYROBINSON@HOTMAIL.COM +1849,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,27-Jan-21,GARY_REESE,M,10-Aug-17,COLONIA_SAN_MANUEL,TONY25@HOTMAIL.COM +1850,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,28-Jan-21,CRYSTAL_ANDERSON,F,11-Mar-83,ALDEA_SAN_ANDRES,ANDREWSCHRISTOPHER@GMAIL.COM +1851,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,28-Jan-21,AMY_DAVIS,F,07-Oct-09,CAMPO_DE_TALAMAYO,PMILLER@YAHOO.COM +1852,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,28-Jan-21,JOSEPH_PATEL,M,06-Nov-07,ALISOS__DE_ABAJO,SANTOSSUSAN@GMAIL.COM +1853,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,28-Jan-21,BRADLEY_BROWN,M,12-Jul-57,COLONIA_LAS_YESCAS,VALERIECRAIG@YAHOO.COM +1854,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,28-Jan-21,KIM_DANIELS,F,19-May-91,CARAGUATA,LARRYWILSON@HOTMAIL.COM +1855,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,28-Jan-21,DR._NICOLE_ROBERTS,F,27-Sep-34,CAPDEPONT,GATESKATHERINE@GMAIL.COM +1856,UNIVERSIDAD_DEL_SALVADOR,BIOQUÍMICA,28-Jan-21,BETHANY_TRUJILLO,F,25-Jun-11,CORONEL_CHARLONE,MORENOCALEB@GMAIL.COM +1857,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,28-Jan-21,MELISSA_LOVE,F,21-Mar-33,GONZALEZ_CATAN,SARA98@GMAIL.COM 
+1858,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,29-Jan-21,RACHEL_WILSON,F,18-Aug-12,GRANADERO_BAIGORRIA,YOLANDABAKER@GMAIL.COM +1859,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,29-Jan-21,RANDY_ADKINS,M,17-Jan-83,ARROYO_DEL_MEDIO,MARGARETDELACRUZ@GMAIL.COM +1860,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,29-Jan-21,KEVIN_CALDERON,M,09-Feb-06,ALVAREZ_JONTE,ADAY@HOTMAIL.COM +1861,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,29-Jan-21,ABIGAIL_NEWTON,F,03-Jun-20,CHOCORI,PAULLEE@YAHOO.COM +1862,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,29-Jan-21,CATHERINE_MURPHY_DVM,F,24-Aug-16,ARROYO_CLARO,BRIANNADANIEL@GMAIL.COM +1863,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_BIOLÓGICAS,29-Jan-21,KATHLEEN_FITZPATRICK,F,29-Jul-65,VILLA_ANGELICA,JOSEPH47@GMAIL.COM +1864,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,29-Jan-21,NICHOLAS_SHAW,M,28-Nov-82,ACEILAN,MARYMASON@GMAIL.COM +1865,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,29-Jan-21,SARA_RAMSEY,F,12-Oct-54,BARRIO_GRAL_JOSE_DE_SAN_MARTIN,SELLERSSHANE@HOTMAIL.COM +1866,UNIVERSIDAD_DEL_SALVADOR,ARQUITECTURA,29-Jan-21,JANET_WYATT,F,14-Apr-71,CAMPO_COUBERT,WELLSMICHAEL@HOTMAIL.COM +1867,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,29-Jan-21,CHARLENE_ALLEN,F,21-Oct-70,ABASTO,ODONNELLEUGENE@GMAIL.COM +1868,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_INDUSTRIAL,30-Jan-21,KATELYN_ROSS,F,11-Jul-59,CAMPO_CHARO,PCLARKE@YAHOO.COM +1869,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,30-Jan-21,RACHAEL_DAVIDSON,F,06-Mar-67,ANGELITA,MORRISJERRY@GMAIL.COM +1870,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,30-Jan-21,MARIAH_MEYER,F,02-Jun-55,CALERA_ARGENTINA,SIMPSONBRIAN@GMAIL.COM +1871,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,30-Jan-21,JAMES_HAMPTON,M,03-Jan-37,LAVALLE,BWOOD@GMAIL.COM +1872,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,30-Jan-21,LISA_WEBB,F,03-Dec-45,MAORI,AMANDACABRERA@GMAIL.COM 
+1873,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PSICOLOGÍA,30-Jan-21,DANIEL_WHITE,M,25-May-55,VALENTIN_ALSINA,EHARRIS@YAHOO.COM +1874,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_ANTROPOLÓGICAS,30-Jan-21,LEAH_MILLER,F,26-May-42,AGUAS_BUENAS,KRISTIN83@YAHOO.COM +1875,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_ELECTRÓNICA,30-Jan-21,SARAH_YOUNG,F,30-Mar-25,CAMPO_DE_GALNASI,MELISSA85@HOTMAIL.COM +1876,UNIVERSIDAD_DEL_SALVADOR,CONTADOR_PÚBLICO_,30-Jan-21,STEVEN_PARKER,M,05-Jul-11,BERRETTA,JON09@HOTMAIL.COM +1877,UNIVERSIDAD_DEL_SALVADOR,MEDICINA,30-Jan-21,JOSHUA_LI,M,12-Dec-81,CAFFERATA,HARRISTIMOTHY@YAHOO.COM +1878,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,30-Jan-21,ANTHONY_GUTIERREZ,M,26-Oct-11,COSTA_GRANDE,ANTHONYJOHNSON@YAHOO.COM +1879,UNIVERSIDAD_DEL_SALVADOR,AGRONOMÍA,30-Jan-21,BARBARA_SMITH,F,23-May-31,RAFAEL_CASTILLO,RICHARDSONMONICA@HOTMAIL.COM +1880,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_POLÍTICA_,31-Jan-21,KRISTA_ADAMS,F,09-May-44,EL_MOLLE,HMORGAN@YAHOO.COM +1881,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,31-Jan-21,DANNY_CRAWFORD,M,19-Apr-90,ARROYO_PASTORA,NMUELLER@HOTMAIL.COM +1882,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ADMINISTRACIÓN_,31-Jan-21,COREY_THOMAS,M,28-Jun-90,CAÑADA_SECA,AHOPKINS@HOTMAIL.COM +1883,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_DE_LA_COMPUTACIÓN,31-Jan-21,JOE_WATTS,M,20-Feb-63,ALDEA_SANTAFECINA,DENNISDOMINIQUE@HOTMAIL.COM +1884,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,31-Jan-21,KATHY_LOPEZ,F,27-Mar-90,ALPACHIRI,MURPHYMANUEL@HOTMAIL.COM +1885,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,31-Jan-21,MEGHAN_NELSON,F,12-Apr-89,COLONIA_BERLIN,VKHAN@HOTMAIL.COM +1886,UNIVERSIDAD_DEL_SALVADOR,FARMACIA,31-Jan-21,ROBERT_ORTEGA,M,22-Sep-95,COLONIA_VALDEZ,MCDANIELMARK@YAHOO.COM +1887,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_ARTES,31-Jan-21,TYLER_ALLEN,M,25-Apr-13,JUAN_MARIA_GUTIERREZ,UTURNER@GMAIL.COM 
+1888,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_RELACIONES_DEL_TRABAJO_,31-Jan-21,MICHELLE_FRANKLIN,F,03-Jan-37,CAMINERA,QWEAVER@HOTMAIL.COM +1889,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIA_Y_TECNOLOGÍA_DE_ALIMENTOS,31-Jan-21,DEBBIE_ENGLISH,F,22-Oct-81,ALGARROBAL_ABAJO,LISAFLORES@HOTMAIL.COM +1890,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,01-Feb-21,ADAM_BREWER,M,04-Jun-11,AVELLANEDA,LOWECATHERINE@HOTMAIL.COM +1891,UNIVERSIDAD_DEL_SALVADOR,CIENCIAS_VETERINARIAS,01-Feb-21,CARMEN_WILLIAMS,F,12-Sep-04,CORONEL_CHARLONE,JRODRIGUEZ@YAHOO.COM +1892,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,01-Feb-21,JENNIFER_DURAN,F,29-Aug-84,RIO_TALA,CAITLINYOUNG@YAHOO.COM +1893,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_MUSICOTERAPIA,01-Feb-21,TYLER_PAGE,M,06-Jun-19,25_DE_MAYO,TIFFANYMURPHY@YAHOO.COM +1894,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_CIENCIAS_GEOLÓGICAS,01-Feb-21,MICHAEL_WRIGHT,M,22-Feb-13,ALVAREZ_JONTE,WALTERLARRY@YAHOO.COM +1895,UNIVERSIDAD_DEL_SALVADOR,TÉCNICO_PARA_BIOTERIOS_,01-Feb-21,SUSAN_BARKER,F,04-Nov-04,12_DE_OCTUBRE,BERGERALEJANDRA@GMAIL.COM +1896,UNIVERSIDAD_DEL_SALVADOR,DISEÑO_DE_IMAGEN_Y_SONIDO,01-Feb-21,AUDREY_HAYNES,F,19-Aug-40,COLONIA_DR_GDOR_UDAONDO,HALLKATELYN@YAHOO.COM +1897,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_GESTIÓN_DE_AGROALIMENTOS,01-Feb-21,VINCENT_WELCH,M,01-Apr-09,CASBAS,GARRETT30@YAHOO.COM +1898,UNIVERSIDAD_DEL_SALVADOR,ACTUARIO_,01-Feb-21,KYLE_MELENDEZ,M,14-May-15,9_DE_ABRIL,EMILYCURRY@HOTMAIL.COM +1899,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_SOCIOLOGÍA_,01-Feb-21,MELISSA_MCCLURE,F,21-Dec-16,CAILOMUTA,RICKEY75@GMAIL.COM +1900,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_MECÁNICA,01-Feb-21,MICHAEL_MOSES,M,04-Jan-07,CABO_SAN_FERMIN,LAURA79@HOTMAIL.COM +1901,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_KINESIOLOGÍA_Y_FISIATRÍA,01-Feb-21,LISA_JOHNSON,F,17-Aug-89,LA_DULCE,ABIGAIL27@YAHOO.COM +1902,UNIVERSIDAD_DEL_SALVADOR,LICENCIATURA_EN_PRODUCCIÓN_DE_BIOIMAGENES,01-Feb-21,PAMELA_CLARK,F,06-Jun-12,RICARDO_ROJAS,WILLIAM03@HOTMAIL.COM 
+1903,UNIVERSIDAD_DEL_SALVADOR,INGENIERÍA_EN_INFORMÁTICA,01-Feb-21,RENEE_WALKER,F,09-Mar-43,ESCUELA_AGRICOLA_DON_BOSCO,CBROWN@YAHOO.COM diff --git a/include/GBUNComahue.sql b/include/GBUNComahue.sql new file mode 100644 index 00000000..d9e436de --- /dev/null +++ b/include/GBUNComahue.sql @@ -0,0 +1 @@ +select universidad , carrera , fecha_de_inscripcion,fc."name", sexo ,fecha_nacimiento,codigo_postal ,correo_electronico from flores_comahue fc where (universidad = 'UNIV. NACIONAL DEL COMAHUE' and (fecha_de_inscripcion between '2020-09-01' and '2021-02-01' )) order by fecha_de_inscripcion asc; diff --git a/include/GBUNSalvador.sql b/include/GBUNSalvador.sql new file mode 100644 index 00000000..2930d7a7 --- /dev/null +++ b/include/GBUNSalvador.sql @@ -0,0 +1,2 @@ +select universidad , carrera , fecha_de_inscripcion,nombre , sexo ,fecha_nacimiento,localidad ,email from salvador_villa_maria svm where (universidad = 'UNIVERSIDAD_DEL_SALVADOR' and (to_date(fecha_de_inscripcion,'DD-Mon-YY') between '2020-09-01' and '2021-02-01')) order by to_date(fecha_de_inscripcion,'DD-Mon-YY') asc; + diff --git a/plugins/connectionDag.py b/plugins/connectionDag.py new file mode 100644 index 00000000..15417141 --- /dev/null +++ b/plugins/connectionDag.py @@ -0,0 +1,74 @@ +import os +# from decouple import config +from decouple import config +from datetime import timedelta +import logging +import decouple + +import logging.config +from sqlCommandB import createPath,identExt + + +def configDag(): + + + default_args = { + 'owner': 'Breyner', + 'retries': 5, + 'retry_delay': timedelta(minutes=10), + } + + POSTGRES_CONN_ID = decouple.config("POSTGRES_CONN_ID") + ACCESS_KEY = decouple.config("ACCESS_KEY") + SECRET_ACCESS_KEY = decouple.config("SECRET_ACCESS_KEY") + AWS_S3_CONN_ID = decouple.config("AWS_S3_CONN_ID") + BUCKET = decouple.config("BUCKET") + # print(".ENv connect->", POSTGRES_CONN_ID) + # logger.info(".ENv connect-> %s", POSTGRES_CONN_ID) + # logger.info("data: %s", name) + return 
default_args, POSTGRES_CONN_ID,ACCESS_KEY,SECRET_ACCESS_KEY,AWS_S3_CONN_ID,BUCKET + + +# def configLog(name): +def configLog(name): + # print("Configlog") + + + pathconf = createPath("assets") + pathRoot = identExt(pathconf, ".cfg") + # print(pathconf) + # print(pathRoot) + n = pathRoot.index(name+".cfg") + pathRoot = pathRoot[n] + path = pathconf+"/"+pathRoot + # print(path) + + logging.config.fileConfig(path,disable_existing_loggers=False) + + logger = logging.getLogger(name) + + return logger + + + + # print(logger) + + # # log something + # logging.info("congfilog prueba") + # logger.debug('debug message') + # logger.info('info message') + # logger.warn('warn message') + # logger.error('error message') + # logger.critical('critical message') + + + + + + + +# print(POSTGRES_CONN_ID) +if __name__ == "__main__": + configDag() + configLog("GBUNComahue_dag_elt") + # print(d,s) diff --git a/plugins/dataTrasB.py b/plugins/dataTrasB.py new file mode 100644 index 00000000..694228fb --- /dev/null +++ b/plugins/dataTrasB.py @@ -0,0 +1,393 @@ + + +from sqlCommandB import createPath, csvFile, txtFile + +import pandas as pd +import random +from datetime import date +import csv +import datetime + + +def sepDat(data, sepv): + N = len(data) + dat_sep = [data[i].split(sepv) for i in range(N)] + dat_sep = pd.Series(dat_sep) + return dat_sep + + +def dateInsc(da): + td = date.today() + c = td.year - 1918 + nc = random.randrange(0, 15, 1) + if c > 15: + c = td.year-1-nc + s = str(c)+"-"+da[1]+"-"+da[2] + return s + + +def dateConvertI(da): + + # + s = "20"+da[2]+"-"+da[1]+"-"+da[0] + fecha = datetime.datetime.strptime( + "{0}".format(s), "%Y-%b-%d").strftime("%Y-%m-%d") + return fecha + + +def saveTxt(dat_file, df): + path_datasets = createPath("datasets") + dat_file_name = path_datasets+'/'+dat_file + df.to_csv(dat_file_name, sep="\t", quoting=csv.QUOTE_NONE, + escapechar=" ", index=False) + + +def dateConvert(da): + num = int(da[2]) + if num > 5: + rf = random.randrange(5, 40, 1) 
+# print(rf) + rf = rf + if rf >= 0 and rf < 5: + # print(rf) + year = "200"+str(rf) + else: + if rf < 10: + year = "199"+str(rf) + else: + year = "19"+str(rf) + else: + year = "200"+str(num) + + s = year+"-"+da[1]+"-"+da[0] + fecha = datetime.datetime.strptime( + "{0}".format(s), "%Y-%b-%d").strftime("%Y-%m-%d") + return fecha + + +def sepDat(data, sepv): + N = len(data) + dat_sep = [data[i].split(sepv) for i in range(N)] + dat_sep = pd.Series(dat_sep) + return dat_sep + + +def uniqueR(datR): + + sd3 = [dat for dat in datR if len(dat) <= 3] + + sd3 = list(set(sd3)) + return sd3 + + +def uniqueI(datR): + + datR = list(datR) + + datR.append('MS.') + datR.append('MISS') + mr = list(set(datR)) + + return mr + + +def calculateAge(dat): + birthdate = date.fromisoformat(dat) + today = date.today() + age = today.year - birthdate.year - ((today.month, today.day) < + (birthdate.month, birthdate.day)) + + if age > 40: + age = random.randrange(17, 40, 2) + elif age < 17: + age = random.randrange(17, 40, 2) + return age + + +def concatDat(dat): + dat = dat.split('_') + cadena = "" + # for i in dat: + # cadena =cadena+" "+i + # i = cadena + cadena = " ".join(dat) + return cadena + + +def rnam(df): + f = " ".join(df) + return f + + +def data_final(df1): + names1 = df1[df1.columns[3]] + path_cp = createPath("assets") + file_cp = csvFile(path=path_cp, select="codigos_postales.csv") + + dfp = pd.read_csv(file_cp) + names = names1 + + if "_" in names[0]: + names_e = sepDat(names, "_") + elif " " in names[0]: + names_e = sepDat(names, " ") + else: + names_e = sepDat(names, " ") + + name = pd.Series(names_e) + + nl = pd.Series(list(map(len, name))) + + dat4 = nl[:] == 4 + dat3 = nl[:] == 3 + dat2 = nl[:] == 2 + + i = nl[dat4].index + k = nl[dat3].index + j = nl[dat2].index + + datindex4 = list(i) + datindex3 = list(k) + datindex2 = list(j) + # names[i] + + # d4 = [print(names[datindex[i]]) for i in range(len(datindex))] + d4 = [name[datindex4[i]] for i in range(len(datindex4))] + + d3 
= [name[datindex3[i]] for i in range(len(datindex3))] + + d2 = [name[datindex2[i]] for i in range(len(datindex2))] + + N34 = len(d4)+len(d3) + N3 = len(d3) + N4 = len(d4) + N2 = len(d2) + + Nt = N3+N4+N2 + + # d4 + + d4 = pd.DataFrame(d4) + + mr = d4[0].unique() + sd = d4[3].unique() + d4 = d4.drop(columns=[0, 3]) + + d4.columns = [df1.columns[3], df1.columns[4]] + + # print(N4 == len(d4)) + d4.index = datindex4 + + # d3 + + d3 = pd.DataFrame(d3) + sd3 = d3[2].unique() + sd3 = list(sd) + + sd3 = uniqueR(d3[2].unique()) + mr3 = uniqueI(mr) + d3.index = datindex3 + + # Join columns 3 to 2 + d = pd.DataFrame(columns=[1, 2]) + + na = [] + for i in range(len(mr3)): + mr0 = d3[0] == mr3[i] + d3t = d3[mr0] + nam = d3t.drop(columns=[0]) + + d = pd.concat([nam, d], sort=True) + + dat3 = d + + d.columns = [0, 1] + e = pd.DataFrame(columns=[0, 1]) + na = [] + for i in range(len(sd3)): + mr0 = d3[2] == sd3[i] + d3t = d3[mr0] + # print(d3t) + nam = d3t.drop(columns=[2]) + # print(nam) + + d = pd.concat([nam, d], sort=True) + e = pd.concat([nam, e], sort=True) + + d.columns = [df1.columns[3], df1.columns[4]] + d3 = d + N3 == len(d3) + N4 == len(d4) + + d34 = pd.concat([d3, d4]) + + N34 == len(d34) + + # d2 + + d2 = pd.DataFrame(d2) + d2.index = datindex2 + + d2.columns = [df1.columns[3], df1.columns[4]] + + d234 = pd.concat([d34, d2]) + # d234.sort_index() + # print(len(d234)== Nt) + + d234 = d234.reset_index() + d234 = d234.sort_values(by="index") + d234.index = d234['index'] + + df1['first_name'] = d234['first_name'] + df1['last_name'] = d234['last_name'] + + df1.gender = df1.gender.replace({"M": "male", "F": "female"}) + + # df1.age =df1.age.apply(calculateAge) + + N = len(df1.university) + if "_" in df1.university[0]: + dat_uni = sepDat(df1.university, "_") + df1.university = df1.university.apply(concatDat) + + if "_" in df1.career[0]: + dat_car = sepDat(df1.career, "_") + df1.career = df1.career.apply(concatDat) + + if df1.postal_code[0] == None: + if "_" in 
df1.location[0]: + dat_car = sepDat(df1.location, "_") + df1.location = df1.location.apply(concatDat) + + for i in range(N): + + pos = dfp.localidad == df1.location[i] + find_loc = dfp[pos] + + daf = find_loc + + da = daf.index + + n = len(da) + rf = random.randrange(0, n, 1) + daf.iloc[rf].values[0] + + df1.postal_code[i] = daf.iloc[rf].values[0] + else: + # print("post") + post = df1.postal_code.unique() + + for i in post: + + cp = i + find_cp = dfp['codigo_postal'] == cp + find_localidad = dfp[find_cp]['localidad'] + find_localidad = find_localidad.values[0] + valP = df1.postal_code == cp + pos = df1[valP] + df1.loc[pos.index, 'location'] = find_localidad + + if df1.age.dtype == 'object': + try: + df1.age = df1.age.apply(calculateAge) + + except: + datfecha = df1.age.values + + da = sepDat(datfecha, "-") + + das = da.apply(dateConvert) + + df1.age = das.apply(calculateAge) + datI = df1.inscription_date.values + + da = sepDat(datI, '-') + + try: + df1.inscription_date = da.apply(dateConvertI) + except: + df1.inscription_date = df1.inscription_date + + df1.postal_code = df1.postal_code.astype('int64') + dob = df1.select_dtypes(include=['object']) + obc = dob.columns + for i in obc: + df1[i] = df1[i].str.lower() + + dg = df1.career.str.split() + + + df1.career = dg.apply(rnam) + return df1 + + +def data_transform(data): + + name_dat = data.split("/") + name_dat = name_dat[-1].split("_") + print(name_dat) + name_dat = name_dat[0] + print(name_dat) + ext = "_process.txt" + dat_file_name = name_dat+ext + print(dat_file_name) + + df = pd.read_csv(data) + ds = pd.Series(['university', 'career', 'inscription_date', 'first_name', + 'last_name', 'gender', 'age', 'postal_code', 'location', 'email']) + +# ds = pd.DataFrame(['university','career','inscription_date','first_name','last_name','gender','age','postal_code','location','email']) + + ds = ['university', 'career', 'inscription_date', 'first_name', + 'last_name', 'gender', 'age', 'postal_code', 'location', 'email'] + + 
df.drop(columns=df.columns[0], inplace=True) + + col = df.columns +# print(len(col),":",len(ds)) + + lastname = ds[4] + + df.insert(4, lastname, 4, allow_duplicates=False) + text1 = "localidad" + text2 = "codigo_postal" + + df.head() + col = df.columns +# print(len(col),":",len(ds)) + + colL = list(col) + + if text2 in col: + # print(text2) + n = colL.index(text2) +# print(n) + + location = ds[n+1] +# print(location) + df.insert(n+1, location, 2, allow_duplicates=False) + df.head() + + elif text1 in col: + # print(text1) + n = colL.index(text1) +# print(n) + location = ds[n] +# print(location) + df.insert(n, location, None, allow_duplicates=False) + df.head() + + df.columns = ds + col = df.columns + + dataFinal = data_final(df) + # print(dat_file_name) + + saveTxt(dat_file_name, dataFinal) + + +if __name__ == "__main__": + + # data = "./files/GBUNComahue_select.csv" + data = "./files/GBUNSalvador_select.csv" + data_transform(data) diff --git a/plugins/sqlCommandB.py b/plugins/sqlCommandB.py new file mode 100644 index 00000000..152f8fef --- /dev/null +++ b/plugins/sqlCommandB.py @@ -0,0 +1,87 @@ + +import os +import pandas as pd +import logging + + +def identExt(path,ext): + contenido = os.listdir(path) + # print("conte:") + # logging.info(contenido) + # print(contenido) + data = [] + for fichero in contenido: + if os.path.isfile(os.path.join(path, fichero)) and fichero.endswith(ext): + data.append(fichero) + return data + + + +def createPath(target): + path = os.getcwd() + contenido = os.listdir(path) + # print(contenido) + indexI = contenido.index(target) + endpoint = contenido[indexI] + path = path+'/'+endpoint + return path + +def csvFile(path,select): + # logging.info('Select_csv') + csv = identExt(path,'.csv') + + n = csv.index(select) + + selectCsv = csv[n] + return path+'/'+selectCsv + + +def txtFile(path, select): + # logging.info('Select_txt') + txt = identExt(path, '.txt') + + n = txt.index(select) + + selectTxt = txt[n] + return path+'/'+selectTxt + + + 
+ + + +def sqlCommand(file,point): + + # logging.info('create_command_sql') + # print("OS-path:") + # print(os.getcwd()) + path = createPath(point) + # print("path____") + # print(path) + sql = identExt(path,'.sql') + # print(sql) + # print(path) + # print(sql[0]) + n = sql.index(file) + fd = open(path+'/'+sql[n], 'r') + sqlFile = fd.read() + fd.close() + # # print(sqlFile) + # sqlcomands = sqlFile.split(';') + # sqlcomands.pop() + sqlCommands =sqlFile + # print(sqlcomands) + # print(len(sqlcomands)) + + # print(sqlcomands) + return sqlCommands + + +if __name__ == '__main__': + + var = sqlCommand(path='Skill-Up-DA-c-PythonG1\include', + file='GBUNSalvador.sql') + + print(var) + + # print(contenido) diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 00000000..45404a56 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,4 @@ +apache-airflow-providers-postgres[amazon] +python-decouple==3.6 +python-dotenv==0.21.0 +dag-factory \ No newline at end of file